@@ -685,18 +685,6 @@ struct jit_brgemm_kernel_post_ops : public jit_generator {
685685
686686 if (req_comp) maybe_apply_comp (m_block, n_block, tail);
687687
688- if (brg.beta != 0 && jcp.with_bias ) {
689- for (int n = 0 ; n < n_block; n++) {
690- auto vmm_bias = vmm_tmp (0 );
691- auto bias_addr = ptr[aux_reg_bias
692- + bia_typesize_ * (n * brg.ld_block )];
693- cvt2ps (bia_dt_, vmm_bias, bias_addr, tail, false , k_mask);
694- for (int m = 0 ; m < m_block; m++) {
695- vaddps (vector (m, n), vmm_bias);
696- }
697- }
698- }
699-
700688 if (brg.beta != 0 ) {
701689 for_ (int m = 0 ; m < m_block; m++)
702690 for (int n = 0 ; n < n_block; n++) {
@@ -714,6 +702,18 @@ struct jit_brgemm_kernel_post_ops : public jit_generator {
714702 }
715703 }
716704
705+ if (brg.beta != 0 && jcp.with_bias ) {
706+ for (int n = 0 ; n < n_block; n++) {
707+ auto vmm_bias = vmm_tmp (0 );
708+ auto bias_addr = ptr[aux_reg_bias
709+ + bia_typesize_ * (n * brg.ld_block )];
710+ cvt2ps (bia_dt_, vmm_bias, bias_addr, tail, false , k_mask);
711+ for (int m = 0 ; m < m_block; m++) {
712+ vaddps (vector (m, n), vmm_bias);
713+ }
714+ }
715+ }
716+
717717 if (postops_injector_) inject_attr_postops (m_block, n_block, tail);
718718
719719 if (brg.beta != 0 && brg.zp_type_c != brgemm_broadcast_t ::none) {
0 commit comments