@@ -467,13 +467,15 @@ status_t brgemm_matmul_conf_utils_t::set_or_check_B_tag(memory_desc_t &B_md,
467467 bgmmc.wei_tag = blocked_B_layouts_allowed && !bgmmc.is_runtime_N
468468 && !bgmmc.is_int4_weights
469469 ? memory_desc_matches_one_of_tag (B_md,
470- plain_tensor_layout_tag,
471- transposed_tensor_layout_tag,
472- blocked_64n_B_layout_tag, blocked_48n_B_layout_tag,
473- blocked_32n_B_layout_tag, blocked_16n_B_layout_tag)
470+ plain_tensor_layout_tag,
471+ transposed_tensor_layout_tag,
472+ blocked_64n_B_layout_tag,
473+ blocked_48n_B_layout_tag,
474+ blocked_32n_B_layout_tag,
475+ blocked_16n_B_layout_tag)
474476 : memory_desc_matches_one_of_tag (B_md,
475- plain_tensor_layout_tag,
476- transposed_tensor_layout_tag, acbd, adbc);
477+ plain_tensor_layout_tag,
478+ transposed_tensor_layout_tag, acbd, adbc);
477479 const bool plain_transposed_matched
478480 = memory_desc_matches_tag (B_md, plain_tensor_layout_tag)
479481 && memory_desc_matches_tag (
@@ -545,15 +547,16 @@ status_t brgemm_matmul_conf_utils_t::set_or_check_tags(memory_desc_t &A_md,
545547 || this ->is_f16_with_int_wei () || this ->is_tf32 ()
546548 || this ->is_f32_with_int_wei ())
547549 && !xf16_avx2_vnni_2;
548- bgmmc.src_tag = is_adbc_allowed ? memory_desc_matches_one_of_tag (
549- A_md, plain_tensor_layout_tag,
550- transposed_tensor_layout_tag, acbd, adbc)
550+ bgmmc.src_tag = is_adbc_allowed
551+ ? memory_desc_matches_one_of_tag (A_md,
552+ plain_tensor_layout_tag,
553+ transposed_tensor_layout_tag, acbd, adbc)
551554 : is_int8_avx512_core
552555 ? memory_desc_matches_one_of_tag (A_md,
553- plain_tensor_layout_tag,
554- transposed_tensor_layout_tag, acbd)
556+ plain_tensor_layout_tag,
557+ transposed_tensor_layout_tag, acbd)
555558 : memory_desc_matches_one_of_tag (
556- A_md, plain_tensor_layout_tag, acbd);
559+ A_md, plain_tensor_layout_tag, acbd);
557560 if (bgmmc.src_tag == format_tag::undef
558561 || (memory_desc_matches_tag (
559562 A_md, transposed_tensor_layout_tag)
@@ -655,8 +658,7 @@ format_tag_t brgemm_matmul_conf_utils_t::pick_blocked_B_layout(
655658 const bool is_amx_or_avx2_vnni_2 = is_superset (bgmmc.isa , avx512_core_amx)
656659 || is_superset (bgmmc.isa , avx2_vnni_2);
657660 const bool prefer_amx_or_avx2_vnni_2 = is_f16 () || is_f32_f16 ()
658- || is_f32_bf16 () || is_f16_with_int_wei ()
659- || is_f32_with_int_wei ();
661+ || is_f32_bf16 () || is_f16_with_int_wei () || is_f32_with_int_wei ();
660662
661663 if ((prefer_amx_or_avx2_vnni_2 && is_amx_or_avx2_vnni_2) || is_bf16 ()
662664 || is_bf16_with_int_wei ()) {
@@ -672,8 +674,7 @@ format_tag_t brgemm_matmul_conf_utils_t::pick_blocked_B_layout(
672674 // Note: bf32 assumes f32 blocking
673675 if (is_f32 () || is_bf32 () || is_f16 () || is_f32_f16 () || is_f32_bf16 ()
674676 || is_f16_with_int_wei () || is_tf32 ()
675- || (is_f32_with_int_wei ()
676- && is_superset (bgmmc.isa , avx512_core))) {
677+ || (is_f32_with_int_wei () && is_superset (bgmmc.isa , avx512_core))) {
677678 switch (n_blk) {
678679 case 64 : return bgmmc.ndims == 3 ? aCB16b64c : BA16a64b;
679680 case 48 : return bgmmc.ndims == 3 ? aCB16b48c : BA16a48b;
@@ -1262,9 +1263,9 @@ status_t compute_blocking_heuristic(brgemm_matmul_conf_t &bgmmc,
12621263
12631264 const float best_imbalance = is_f32
12641265 ? compute_blocking_heuristic_avx2_f32 (
1265- bgmmc, bm_conf_utils, matmul, best_blocking)
1266+ bgmmc, bm_conf_utils, matmul, best_blocking)
12661267 : compute_blocking_heuristic_avx2 (
1267- bgmmc, bm_conf_utils, matmul, best_blocking);
1268+ bgmmc, bm_conf_utils, matmul, best_blocking);
12681269
12691270 VCONDCHECK_BG (best_imbalance != 1 .f , VERBOSE_BLOCKING_FAIL, " " )
12701271
@@ -1748,9 +1749,9 @@ status_t init_brgemm_matmul_conf(cpu_isa_t isa, brgemm_matmul_conf_t &bgmmc,
17481749 bgmmc.N_tail = bgmmc.is_runtime_N ? 0 : bgmmc.N % bgmmc.N_blk ;
17491750 bgmmc.K_tail = bgmmc.K > bgmmc.K_blk
17501751 ? ((bgmmc.extendable_k || bgmmc.use_fused_copy_a )
1751- ? bgmmc.K % bgmmc.K_blk
1752- : rnd_up (bgmmc.K % bgmmc.K_blk ,
1753- bgmmc.required_k_granularity ))
1752+ ? bgmmc.K % bgmmc.K_blk
1753+ : rnd_up (bgmmc.K % bgmmc.K_blk ,
1754+ bgmmc.required_k_granularity ))
17541755 : 0 ;
17551756
17561757 bgmmc.LDB = bm_conf_utils.get_actual_LDB ();
0 commit comments