Issue1388 (#1389)
* Calculation of chunk range limits was ignoring num_cpu (bug introduced by me in #1262) - should fix #1388 * Calculation of range limits was ignoring num_cpu (bug introduced by me in #1262) * Calculation of chunk range limits was ignoring num_cpu (bug introduced by me in #1262) * Calculation of chunk range limits was ignoring num_cpu (bug introduced by me in #1262) * Calculation of chunk range limits was ignoring num_cpu (bug introduced by me in #1262) * Calculation of chunk range limits was ignoring num_cpu (bug introduced by me in #1262)
This commit is contained in:
@@ -288,7 +288,7 @@ int CNAME(BLASLONG n, BLASLONG k, FLOAT *a, BLASLONG lda, FLOAT *x, BLASLONG inc
|
||||
|
||||
range_m[MAX_CPU_NUMBER - num_cpu - 1] = range_m[MAX_CPU_NUMBER - num_cpu] - width;
|
||||
range_n[num_cpu] = num_cpu * (((n + 15) & ~15) + 16);
|
||||
if (range_n[num_cpu] > n) range_n[num_cpu] = n;
|
||||
if (range_n[num_cpu] > n * num_cpu) range_n[num_cpu] = n * num_cpu;
|
||||
|
||||
queue[num_cpu].mode = mode;
|
||||
queue[num_cpu].routine = trmv_kernel;
|
||||
@@ -328,7 +328,7 @@ int CNAME(BLASLONG n, BLASLONG k, FLOAT *a, BLASLONG lda, FLOAT *x, BLASLONG inc
|
||||
|
||||
range_m[num_cpu + 1] = range_m[num_cpu] + width;
|
||||
range_n[num_cpu] = num_cpu * (((n + 15) & ~15) + 16);
|
||||
if (range_n[num_cpu] > n) range_n[num_cpu] = n;
|
||||
if (range_n[num_cpu] > n * num_cpu) range_n[num_cpu] = n * num_cpu;
|
||||
|
||||
queue[num_cpu].mode = mode;
|
||||
queue[num_cpu].routine = trmv_kernel;
|
||||
@@ -358,7 +358,7 @@ int CNAME(BLASLONG n, BLASLONG k, FLOAT *a, BLASLONG lda, FLOAT *x, BLASLONG inc
|
||||
|
||||
range_m[num_cpu + 1] = range_m[num_cpu] + width;
|
||||
range_n[num_cpu] = num_cpu * (((n + 15) & ~15) + 16);
|
||||
if (range_n[num_cpu] > n) range_n[num_cpu] = n;
|
||||
if (range_n[num_cpu] > n * num_cpu) range_n[num_cpu] = n * num_cpu;
|
||||
|
||||
queue[num_cpu].mode = mode;
|
||||
queue[num_cpu].routine = trmv_kernel;
|
||||
|
||||
Reference in New Issue
Block a user