Add conditional compilation (#if defined(LOONGSON3A)) to avoid affecting the performance of other platforms.
This commit is contained in:
		
							parent
							
								
									831858b883
								
							
						
					
					
						commit
						9fe3049de6
					
				| 
						 | 
					@ -71,16 +71,25 @@ int CNAME(int mode, blas_arg_t *arg, BLASLONG *range_m, BLASLONG *range_n, int (
 | 
				
			||||||
    queue[num_cpu].args    = arg;
 | 
					    queue[num_cpu].args    = arg;
 | 
				
			||||||
    queue[num_cpu].range_m = range_m;
 | 
					    queue[num_cpu].range_m = range_m;
 | 
				
			||||||
    queue[num_cpu].range_n = &range[num_cpu];
 | 
					    queue[num_cpu].range_n = &range[num_cpu];
 | 
				
			||||||
    queue[num_cpu].sa      = sa	+ GEMM_OFFSET_A1 * num_cpu;	//NULL;
 | 
					#if defined(LOONGSON3A)
 | 
				
			||||||
    queue[num_cpu].sb      = queue[num_cpu].sa + GEMM_OFFSET_A1 * 5;//NULL;
 | 
					    queue[num_cpu].sa      = sa	+ GEMM_OFFSET_A1 * num_cpu;
 | 
				
			||||||
 | 
					    queue[num_cpu].sb      = queue[num_cpu].sa + GEMM_OFFSET_A1 * 5;
 | 
				
			||||||
 | 
					#else
 | 
				
			||||||
 | 
						queue[num_cpu].sa      = NULL;
 | 
				
			||||||
 | 
					    queue[num_cpu].sb      = NULL;
 | 
				
			||||||
 | 
					#endif
 | 
				
			||||||
    queue[num_cpu].next    = &queue[num_cpu + 1];
 | 
					    queue[num_cpu].next    = &queue[num_cpu + 1];
 | 
				
			||||||
    num_cpu ++;
 | 
					    num_cpu ++;
 | 
				
			||||||
  }
 | 
					  }
 | 
				
			||||||
  
 | 
					  
 | 
				
			||||||
  if (num_cpu) {
 | 
					  if (num_cpu) {
 | 
				
			||||||
 | 
					#if defined(LOONGSON3A)
 | 
				
			||||||
    queue[0].sa = sa;
 | 
					    queue[0].sa = sa;
 | 
				
			||||||
    queue[0].sb = sa + GEMM_OFFSET_A1 * 5;
 | 
					    queue[0].sb = sa + GEMM_OFFSET_A1 * 5;
 | 
				
			||||||
 | 
					#else
 | 
				
			||||||
 | 
						queue[0].sa = sa;
 | 
				
			||||||
 | 
						queue[0].sb = sb;
 | 
				
			||||||
 | 
					#endif
 | 
				
			||||||
    queue[num_cpu - 1].next = NULL;
 | 
					    queue[num_cpu - 1].next = NULL;
 | 
				
			||||||
    
 | 
					    
 | 
				
			||||||
    exec_blas(num_cpu,
 | 
					    exec_blas(num_cpu,
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
		Loading…
	
		Reference in New Issue