Skip to content

Commit

Permalink
perf_test/blas/blas3: Disable simd verify for cuda/10.2.2
Browse files Browse the repository at this point in the history
  • Loading branch information
e10harvey committed Sep 2, 2021
1 parent bc36de8 commit 4a5d013
Showing 1 changed file with 10 additions and 0 deletions.
10 changes: 10 additions & 0 deletions perf_test/blas/blas3/KokkosBlas3_gemm_perf_test.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -1504,6 +1504,12 @@ template <class dstViewType>
static inline void __gemm_copy_simd_view_to_3d_view(gemm_simd_args_t src,
dstViewType dst,
options_t options) {
// clang-format off
// Related issue: https://github.com/kokkos/kokkos-kernels/issues/998
// CUDA 10.2 (CUDA_VERSION == 10020, referred to here as cuda/10.2.2) generates a compiler error:
// KokkosBlas3_gemm_perf_test.hpp: error: ‘h_subview_type_2d’ was not declared in this scope
// clang-format on
#if (CUDA_VERSION != 10020)
using dst_scalar_type = typename dstViewType::value_type;
using src_scalar_type = typename view_type_5d::value_type;
size_t remainder, vector_batch_size, simd_batch_size, last_batch;
Expand Down Expand Up @@ -1631,6 +1637,10 @@ static inline void __gemm_copy_simd_view_to_3d_view(gemm_simd_args_t src,
out:
Kokkos::deep_copy(dst, h_dst);
Kokkos::fence();
#else
Kokkos::abort(
"Cannot perform simd verification with cuda/10.2.2, rerun with -v 0");
#endif // #if (CUDA_VERSION != 10020)
}

/**
Expand Down

0 comments on commit 4a5d013

Please sign in to comment.