Calculation of chunk range limits was ignoring num_cpu
Bug introduced by me in #1262; this should fix #1388.
This commit is contained in:
parent
281a2b952f
commit
e90a147493
|
@@ -230,10 +230,10 @@ int CNAME(BLASLONG m, BLASLONG n, BLASLONG ku, BLASLONG kl, FLOAT *alpha, FLOAT
|
||||||
|
|
||||||
#ifndef TRANSA
|
#ifndef TRANSA
|
||||||
range_m[num_cpu] = num_cpu * ((m + 15) & ~15);
|
range_m[num_cpu] = num_cpu * ((m + 15) & ~15);
|
||||||
if (range_m[num_cpu] > m) range_m[num_cpu] = m;
|
if (range_m[num_cpu] > m * num_cpu) range_m[num_cpu] = m * num_cpu;
|
||||||
#else
|
#else
|
||||||
range_m[num_cpu] = num_cpu * ((n + 15) & ~15);
|
range_m[num_cpu] = num_cpu * ((n + 15) & ~15);
|
||||||
if (range_m[num_cpu] > n) range_m[num_cpu] = n;
|
if (range_m[num_cpu] > n * num_cpu) range_m[num_cpu] = n * num_cpu;
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
queue[num_cpu].mode = mode;
|
queue[num_cpu].mode = mode;
|
||||||
|
|
Loading…
Reference in New Issue