diff --git a/driver/others/init.c b/driver/others/init.c index 0cb8c78a21..012ef6647d 100644 --- a/driver/others/init.c +++ b/driver/others/init.c @@ -903,6 +903,7 @@ void gotoblas_affinity_init(void) { } #else common->num_procs = CPU_COUNT(sizeof(cpu_set_t),cpusetp); + } #endif #endif diff --git a/driver/others/memory.c b/driver/others/memory.c index e4caa093ab..1d5b70003f 100644 --- a/driver/others/memory.c +++ b/driver/others/memory.c @@ -177,7 +177,7 @@ int get_num_procs(void) { cpu_set_t *cpusetp; size_t size; int ret; -int i,n; +// int i,n; if (!nums) nums = sysconf(_SC_NPROCESSORS_CONF); #if !defined(OS_LINUX) diff --git a/kernel/generic/laswp_ncopy_2.c b/kernel/generic/laswp_ncopy_2.c index a29562df9a..32dbf871b6 100644 --- a/kernel/generic/laswp_ncopy_2.c +++ b/kernel/generic/laswp_ncopy_2.c @@ -116,7 +116,7 @@ int CNAME(BLASLONG n, BLASLONG k1, BLASLONG k2, FLOAT *a, BLASLONG lda, blasint *b2 = A2; *b4 = A4; } - } else + } else { if (b1 == a2) { if (b2 == a2) { *(buffer + 0) = A2; @@ -139,7 +139,7 @@ int CNAME(BLASLONG n, BLASLONG k1, BLASLONG k2, FLOAT *a, BLASLONG lda, blasint *(buffer + 3) = A4; *b1 = A1; *b3 = A3; - } else + } else { if (b2 == b1) { *(buffer + 0) = B1; *(buffer + 1) = B3; @@ -157,6 +157,8 @@ int CNAME(BLASLONG n, BLASLONG k1, BLASLONG k2, FLOAT *a, BLASLONG lda, blasint *b3 = A3; *b4 = A4; } + } + } } buffer += 4; diff --git a/kernel/generic/trmm_ltcopy_2.c b/kernel/generic/trmm_ltcopy_2.c index 13a3bc53ce..60cdeed1c3 100644 --- a/kernel/generic/trmm_ltcopy_2.c +++ b/kernel/generic/trmm_ltcopy_2.c @@ -120,30 +120,18 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON ao2 += 1; */ b += 2; } else +#ifdef UNIT if (X < posY) { - data01 = *(ao1 + 0); - data02 = *(ao1 + 1); - - b[ 0] = data01; - b[ 1] = data02; - // ao1 += lda; - b += 2; - } else { +#endif + b[ 0] = *(ao1 + 0); #ifdef UNIT - data02 = *(ao1 + 1); + } else { b[ 0] = ONE; - b[ 1] = data02; -#else - data01 = *(ao1 + 0); - data02 = *(ao1 + 1); - - b[ 0] = data01; - b[ 1] = data02; -#endif - // ao1 += 2; - b += 2; } +#endif + b[ 1] = *(ao1 + 1); + b += 2; } posY += 2; diff --git a/kernel/generic/trmm_ltcopy_4.c b/kernel/generic/trmm_ltcopy_4.c index 128536aad5..e90d892096 100644 --- a/kernel/generic/trmm_ltcopy_4.c +++ b/kernel/generic/trmm_ltcopy_4.c @@ -410,36 +410,17 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON i = (m & 1); if (i) { - - if (X > posY) { - /* ao1 += 1; - ao2 += 1; */ - - b += 2; - } else - if (X < posY) { - data01 = *(ao1 + 0); - data02 = *(ao1 + 1); - - b[ 0] = data01; - b[ 1] = data02; - // ao1 += lda; - b += 2; - } else { #ifdef UNIT - data02 = *(ao1 + 1); - - b[ 0] = ONE; - b[ 1] = data02; -#else - data01 = *(ao1 + 0); - data02 = *(ao1 + 1); - - b[ 0] = data01; - b[ 1] = data02; + if (X < posY) { #endif - b += 2; - } + b[ 0] = *(ao1 + 0); +#ifdef UNIT + } else { + b[ 0] = ONE; + } +#endif + b[ 1] = *(ao1 + 1); + b += 2; } posY += 2; } diff --git a/kernel/generic/trmm_utcopy_16.c b/kernel/generic/trmm_utcopy_16.c index 5d0f7dd2e2..12642e7db6 100644 --- a/kernel/generic/trmm_utcopy_16.c +++ b/kernel/generic/trmm_utcopy_16.c @@ -1487,23 +1487,19 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON if (X < posY) { a01 ++; a02 ++; - b += 2; - } else + } else { +#ifdef UNIT if (X > posY) { +#endif b[ 0] = *(a01 + 0); - b[ 1] = *(a01 + 1); - // a01 += lda; - b += 2; - } else { #ifdef UNIT + } else { b[ 0] = ONE; - b[ 1] = *(a01 + 1); -#else - b[ 0] = *(a01 + 0); - b[ 1] = *(a01 + 1); -#endif - b += 2; } +#endif + b[ 1] = *(a01 + 1); + } + b += 2; } posY += 2; } @@ -1522,25 +1518,22 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON if (i > 0) { do { if (X < posY) { - a01 += 1; - b ++; - } else + a01 ++; + } else { +#ifdef UNIT if (X > posY) { +#endif b[ 0] = *(a01 + 0); - a01 += lda; - b ++; - } else { #ifdef UNIT + } else { b[ 0] = ONE; -#else - b[ 0] = *(a01 + 0); -#endif - a01 += lda; - b ++; } - - X += 1; - i --; +#endif + a01 += lda; + } + b ++; + X ++; + i --; } while (i > 0); } // posY += 1; diff --git a/kernel/generic/trmm_utcopy_2.c b/kernel/generic/trmm_utcopy_2.c index efa68162cf..75076c3822 100644 --- a/kernel/generic/trmm_utcopy_2.c +++ b/kernel/generic/trmm_utcopy_2.c @@ -161,27 +161,18 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON i = m; if (m > 0) { do { - if (X < posY) { - b += 1; - ao1 += 1; - } else - if (X > posY) { - data01 = *(ao1 + 0); - b[ 0] = data01; - b += 1; - ao1 += lda; - } else { #ifdef UNIT - b[ 0] = ONE; -#else - data01 = *(ao1 + 0); - b[ 0] = data01; + if (X > posY) { #endif - b += 1; - ao1 += lda; - } - - X += 1; + b[ 0] = *(ao1 + 0); +#ifdef UNIT + } else { + b[ 0] = ONE; + } +#endif + b ++; + ao1 += lda; + X ++; i --; } while (i > 0); } diff --git a/kernel/generic/trmm_utcopy_4.c b/kernel/generic/trmm_utcopy_4.c index 3e7726b61d..e5844094e5 100644 --- a/kernel/generic/trmm_utcopy_4.c +++ b/kernel/generic/trmm_utcopy_4.c @@ -443,26 +443,21 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON do { if (X < posY) { - b += 1; ao1 += 1; - } else + } else { +#ifdef UNIT if (X > posY) { - data01 = *(ao1 + 0); - b[ 0] = data01; - ao1 += lda; - b += 1; - } else { +#endif + b[ 0] = *(ao1 + 0); #ifdef UNIT + } else { b[ 0] = ONE; -#else - data01 = *(ao1 + 0); - b[ 0] = data01; -#endif - ao1 += lda; - b += 1; } - - X += 1; +#endif + ao1 += lda; + } + b ++; + X ++; i --; } while (i > 0); } diff --git a/kernel/generic/trmmkernel_16x2.c b/kernel/generic/trmmkernel_16x2.c index 078a91dd56..8e96edf854 100644 --- a/kernel/generic/trmmkernel_16x2.c +++ b/kernel/generic/trmmkernel_16x2.c @@ -52,6 +52,8 @@ int CNAME(BLASLONG bm,BLASLONG bn,BLASLONG bk,FLOAT alpha,FLOAT* ba,FLOAT* bb,FL #if !defined(LEFT) off = -offset; +#else + off = 0; #endif diff --git a/kernel/generic/trmmkernel_2x2.c b/kernel/generic/trmmkernel_2x2.c index 40fbeeabb5..05fe1876cc 100644 --- a/kernel/generic/trmmkernel_2x2.c +++ b/kernel/generic/trmmkernel_2x2.c @@ -11,6 +11,8 @@ int CNAME(BLASLONG bm,BLASLONG bn,BLASLONG bk,FLOAT alpha,FLOAT* ba,FLOAT* bb,FL BLASLONG off, temp; #if defined(TRMMKERNEL) && !defined(LEFT) off = -offset; +#else + off = 0; #endif for (j=0; j 0); } diff --git a/kernel/generic/zlaswp_ncopy_4.c b/kernel/generic/zlaswp_ncopy_4.c index 192494b071..0de393838f 100644 --- a/kernel/generic/zlaswp_ncopy_4.c +++ b/kernel/generic/zlaswp_ncopy_4.c @@ -462,7 +462,7 @@ int CNAME(BLASLONG n, BLASLONG k1, BLASLONG k2, FLOAT *a, BLASLONG lda, blasint *(b4 + 0) = A7; *(b4 + 1) = A8; } - } else + } else { if (b1 == a2) { if (b2 == a2) { *(buffer + 0) = A3; @@ -503,7 +503,7 @@ int CNAME(BLASLONG n, BLASLONG k1, BLASLONG k2, FLOAT *a, BLASLONG lda, blasint *(b1 + 1) = A2; *(b3 + 0) = A5; *(b3 + 1) = A6; - } else + } else { if (b2 == b1) { *(buffer + 0) = B1; *(buffer + 1) = B2; @@ -536,6 +536,8 @@ int CNAME(BLASLONG n, BLASLONG k1, BLASLONG k2, FLOAT *a, BLASLONG lda, blasint *(b4 + 0) = A7; *(b4 + 1) = A8; } + } + } } buffer += 8; diff --git a/kernel/generic/ztrmm_ltcopy_2.c b/kernel/generic/ztrmm_ltcopy_2.c index deb675f733..7969f4f3db 100644 --- a/kernel/generic/ztrmm_ltcopy_2.c +++ b/kernel/generic/ztrmm_ltcopy_2.c @@ -139,48 +139,18 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON } if (m & 1) { - - if (X > posY) { - /* ao1 += 2; - ao2 += 2; */ - b += 4; - - } else +#ifdef UNIT if (X < posY) { - data1 = *(ao1 + 0); - data2 = *(ao1 + 1); - data3 = *(ao1 + 2); - data4 = *(ao1 + 3); - - b[ 0] = data1; - b[ 1] = data2; - b[ 2] = data3; - b[ 3] = data4; - - // ao1 += lda; - b += 4; - } else { +#endif + b[ 0] = *(ao1 + 0); + b[ 1] = *(ao1 + 1); #ifdef UNIT - data3 = *(ao1 + 2); - data4 = *(ao1 + 3); - + } else { b[ 0] = ONE; b[ 1] = ZERO; - b[ 2] = data3; - b[ 3] = data4; -#else - data1 = *(ao1 + 0); - data2 = *(ao1 + 1); - data3 = *(ao1 + 2); - data4 = *(ao1 + 3); - - b[ 0] = data1; - b[ 1] = data2; - b[ 2] = data3; - b[ 3] = data4; -#endif - b += 4; } +#endif + b += 4; } posY += 2; diff --git a/kernel/generic/ztrmm_utcopy_1.c b/kernel/generic/ztrmm_utcopy_1.c index 2746c5f5c3..94d23ef9b3 100644 --- a/kernel/generic/ztrmm_utcopy_1.c +++ b/kernel/generic/ztrmm_utcopy_1.c @@ -44,7 +44,7 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON BLASLONG i, js; BLASLONG X; - FLOAT data01, data02; +// FLOAT data01, data02; FLOAT *ao1; lda += lda; @@ -65,30 +65,21 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON do { if (X < posY) { ao1 += 2; - b += 2; - } else + } else { +#ifdef UNIT if (X > posY) { - data01 = *(ao1 + 0); - data02 = *(ao1 + 1); - b[ 0] = data01; - b[ 1] = data02; - ao1 += lda; - b += 2; - - } else { +#endif + b[ 0] = *(ao1 + 0); + b[ 1] = *(ao1 + 1); #ifdef UNIT + } else { b[ 0] = ONE; b[ 1] = ZERO; -#else - data01 = *(ao1 + 0); - data02 = *(ao1 + 1); - b[ 0] = data01; - b[ 1] = data02; -#endif - ao1 += lda; - b += 2; } - +#endif + ao1 += lda; + } + b += 2; X ++; i --; } while (i > 0); diff --git a/kernel/generic/ztrmm_utcopy_2.c b/kernel/generic/ztrmm_utcopy_2.c index 6c7288ae92..03ce93d993 100644 --- a/kernel/generic/ztrmm_utcopy_2.c +++ b/kernel/generic/ztrmm_utcopy_2.c @@ -203,33 +203,22 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON do { if (X < posY) { ao1 += 2; - b += 2; - } else + } else { +#ifdef UNIT if (X > posY) { - data1 = *(ao1 + 0); - data2 = *(ao1 + 1); - - b[ 0] = data1; - b[ 1] = data2; - - ao1 += lda; - b += 2; - } else { +#endif + b[ 0] = *(ao1 + 0); + b[ 1] = *(ao1 + 1); #ifdef UNIT + } else { b[ 0] = ONE; b[ 1] = ZERO; -#else - data1 = *(ao1 + 0); - data2 = *(ao1 + 1); - - b[ 0] = data1; - b[ 1] = data2; -#endif - ao1 += lda; - b += 2; } - - X += 1; +#endif + ao1 += lda; + } + b += 2; + X ++; i --; } while (i > 0); } diff --git a/kernel/generic/ztrmm_utcopy_8.c b/kernel/generic/ztrmm_utcopy_8.c index ed4578579e..946c136e79 100644 --- a/kernel/generic/ztrmm_utcopy_8.c +++ b/kernel/generic/ztrmm_utcopy_8.c @@ -856,25 +856,22 @@ int CNAME(BLASLONG m, BLASLONG n, FLOAT *a, BLASLONG lda, BLASLONG posX, BLASLON do { if (X < posY) { a01 += 2; - b += 2; - } else + } else { +#ifdef UNIT if (X > posY) { +#endif b[ 0] = *(a01 + 0); b[ 1] = *(a01 + 1); - a01 += lda; - b += 2; - } else { #ifdef UNIT + } else { b[ 0] = ONE; b[ 1] = ZERO; -#else - b[ 0] = *(a01 + 0); - b[ 1] = *(a01 + 1); -#endif - a01 += lda; - b += 2; } - X += 1; +#endif + a01 += lda; + } + b += 2; + X ++; i --; } while (i > 0); } diff --git a/kernel/generic/ztrmmkernel_2x2.c b/kernel/generic/ztrmmkernel_2x2.c index ecb2a97cd5..88e7197e4f 100644 --- a/kernel/generic/ztrmmkernel_2x2.c +++ b/kernel/generic/ztrmmkernel_2x2.c @@ -15,6 +15,8 @@ int CNAME(BLASLONG bm,BLASLONG bn,BLASLONG bk,FLOAT alphar,FLOAT alphai,FLOAT* b #if defined(TRMMKERNEL) && !defined(LEFT) off = -offset; +#else + off = 0; #endif for (j=0; j