Skip to content

Commit

Permalink
fixup: x64: brgemm matmul: fix tile configuration
Browse files Browse the repository at this point in the history
  • Loading branch information
kwiersch authored and tprimak committed Apr 6, 2023
1 parent d264ba4 commit be942a2
Showing 1 changed file with 4 additions and 2 deletions.
6 changes: 4 additions & 2 deletions src/cpu/x64/matmul/brgemm_matmul.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -135,7 +135,8 @@ status_t brgemm_matmul_t<isa>::pd_t::init(engine_t *engine) {
brgemm_attr_t brgattr;
brgattr.generate_skip_accumulation
= bgmmc_.post_ops_applicable && bgmmc_.nthr_k > 1;
- const bool is_amx = is_superset(isa, avx512_core_amx);
+ constexpr bool is_amx = one_of(
+ isa, avx512_core_bf16_amx_int8, avx512_core_bf16_amx_bf16);
if (is_amx) {
if (!brgattr.generate_skip_accumulation) {
// TODO: uker doesn't yet support generate_skip_accumulation
Expand Down Expand Up @@ -400,7 +401,8 @@ void brgemm_matmul_t<isa>::maybe_reduce_partial_results_and_apply_postops(
const brg_matmul_exec_ctx_t &brgmm_ctx) const {
if (!brgmm_ctx.parallel_reduction_is_used()) return;

- const bool is_amx = is_superset(isa, avx512_core_amx);
+ constexpr bool is_amx
+ = one_of(isa, avx512_core_bf16_amx_int8, avx512_core_bf16_amx_bf16);

const auto &bgmmc = pd()->get_brgemm_matmul_conf();
const int num_threads = brgmm_ctx.get_num_threads_for_parallelization();
Expand Down

0 comments on commit be942a2

Please sign in to comment.