Skip to content

Commit 78d9910

Browse files
authored
Correct range_n limiting
Same bug as seen in #1388; it was somehow missed in the corresponding PR #1389.
1 parent 69edc5b commit 78d9910

File tree

1 file changed: 3 additions (+3) and 4 deletions (-4).

driver/level2/trmv_thread.c

Lines changed: 3 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -346,8 +346,8 @@ int CNAME(BLASLONG m, FLOAT *a, BLASLONG lda, FLOAT *x, BLASLONG incx, FLOAT *bu
346 346

347 347
range_m[MAX_CPU_NUMBER - num_cpu - 1] = range_m[MAX_CPU_NUMBER - num_cpu] - width;
348 348
range_n[num_cpu] = num_cpu * (((m + 15) & ~15) + 16);
349-
if (range_n[num_cpu] > m) range_n[num_cpu] = m;
350-
349+
if (range_n[num_cpu] > m * num_cpu) range_n[num_cpu] = m * num_cpu;
350+
}
351 351
queue[num_cpu].mode = mode;
352 352
queue[num_cpu].routine = trmv_kernel;
353 353
queue[num_cpu].args = &args;
@@ -386,8 +386,7 @@ int CNAME(BLASLONG m, FLOAT *a, BLASLONG lda, FLOAT *x, BLASLONG incx, FLOAT *bu
386 386

387 387
range_m[num_cpu + 1] = range_m[num_cpu] + width;
388 388
range_n[num_cpu] = num_cpu * (((m + 15) & ~15) + 16);
389-
if (range_n[num_cpu] > m) range_n[num_cpu] = m;
390-
389+
if (range_n[num_cpu] > m * num_cpu) range_n[num_cpu] = m * num_cpu;
391 390
queue[num_cpu].mode = mode;
392 391
queue[num_cpu].routine = trmv_kernel;
393 392
queue[num_cpu].args = &args;

0 commit comments

Comments
 (0)