@@ -104,7 +104,7 @@ typedef struct {
 #define BETA_OPERATION(M_FROM , M_TO , N_FROM , N_TO , BETA , C , LDC ) \
  GEMM_BETA((M_TO) - (M_FROM), (N_TO - N_FROM), 0, \
  BETA[0], BETA[1], NULL, 0, NULL, 0, \
- (FLOAT *)(C) + (M_FROM) + (N_FROM) * (LDC) * COMPSIZE, LDC)
+ (FLOAT *)(C) + (( M_FROM) + (N_FROM) * (LDC) ) * COMPSIZE, LDC)
 #endif
 
 #ifndef ICOPYB_OPERATION
@@ -414,7 +414,7 @@ static int inner_thread(blas_arg_t *args, BLASLONG *range_m, BLASLONG *range_n,
 
  for (jjs = xxx ; jjs < MIN (n_to , xxx + div_n ); jjs += min_jj ){
  min_jj = MIN (n_to , xxx + div_n ) - jjs ;
- if (min_jj > GEMM3M_UNROLL_N ) min_jj = GEMM3M_UNROLL_N ;
+ if (min_jj > GEMM3M_UNROLL_N * 3 ) min_jj = GEMM3M_UNROLL_N * 3 ;
 
  START_RPCC ();
 
@@ -550,7 +550,7 @@ static int inner_thread(blas_arg_t *args, BLASLONG *range_m, BLASLONG *range_n,
 
  for (jjs = xxx ; jjs < MIN (n_to , xxx + div_n ); jjs += min_jj ){
  min_jj = MIN (n_to , xxx + div_n ) - jjs ;
- if (min_jj > GEMM3M_UNROLL_N ) min_jj = GEMM3M_UNROLL_N ;
+ if (min_jj > GEMM3M_UNROLL_N * 3 ) min_jj = GEMM3M_UNROLL_N * 3 ;
 
  START_RPCC ();
 
@@ -687,7 +687,7 @@ static int inner_thread(blas_arg_t *args, BLASLONG *range_m, BLASLONG *range_n,
 
  for (jjs = xxx ; jjs < MIN (n_to , xxx + div_n ); jjs += min_jj ){
  min_jj = MIN (n_to , xxx + div_n ) - jjs ;
- if (min_jj > GEMM3M_UNROLL_N ) min_jj = GEMM3M_UNROLL_N ;
+ if (min_jj > GEMM3M_UNROLL_N * 3 ) min_jj = GEMM3M_UNROLL_N * 3 ;
 
  START_RPCC ();
 
0 commit comments