/*
 * ATL_creftrmmLUCN -- ATL_creftrmm kernel for the case
 * ( AtlasLeft, AtlasUpper, AtlasConjTrans, AtlasNonUnit ).
 *
 * A and B are indexed as interleaved (real, imaginary) float pairs in
 * column-major order, with 2*LDA and 2*LDB floats between successive
 * columns.  Each of the N columns of B is updated in place, one entry
 * at a time: entry i is combined with the conjugated diagonal entry
 * A(i,i), the conjugated entries A(k,i), k < i, paired with B(k,j) are
 * accumulated on top, and the result is combined with ALPHA and stored
 * back into B(i,j).
 *
 * NOTE(review): Mset, Msscl, Mmla and Mmul are macros defined outside
 * this view; the description assumes copy, in-place complex scale,
 * complex multiply-accumulate and complex multiply -- confirm.
 */
void ATL_creftrmmLUCN
(
   const int M, const int N, const float * ALPHA,
   const float * A, const int LDA, float * B, const int LDB
)
{
   const int a_step = 2 * LDA, b_step = 2 * LDB;
   float sum_i, sum_r;
   int a_col, a_pos, b_col, b_dst, b_src, col, p, row;

   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;
/*
 * Rows are visited bottom-up so that the entries B(k,j), k < row, read
 * by the inner loop have not been overwritten yet.
 */
      for( row = M - 1; row >= 0; row-- )
      {
         a_col = row * a_step;
         b_dst = b_col + 2 * row;
         a_pos = a_col + 2 * row;          /* diagonal entry A(row,row) */

         Mset( B[b_dst], B[b_dst+1], sum_r, sum_i );
         Msscl( A[a_pos], -A[a_pos+1], sum_r, sum_i );

         a_pos = a_col;
         b_src = b_col;
         for( p = 0; p < row; p++ )
         {
            Mmla( A[a_pos], -A[a_pos+1], B[b_src], B[b_src+1], sum_r, sum_i );
            a_pos += 2;
            b_src += 2;
         }
         Mmul( ALPHA[0], ALPHA[1], sum_r, sum_i, B[b_dst], B[b_dst+1] );
      }
   }
}
/*
 * ATL_creftrsmLLTU -- ATL_creftrsm kernel for the case
 * ( AtlasLeft, AtlasLower, AtlasTrans, AtlasUnit ).
 *
 * A and B are indexed as interleaved (real, imaginary) float pairs in
 * column-major order (2*LDA / 2*LDB floats per column).  For every
 * column of B, entry i is combined with ALPHA, the products
 * A(k,i) * B(k,j) for k > i are removed from it, and the result is
 * written back.  The diagonal of A is never read.
 *
 * NOTE(review): Mmul, Mmls and Mset are macros defined outside this
 * view; complex multiply, multiply-subtract and copy are assumed.
 */
void ATL_creftrsmLLTU
(
   const int M, const int N, const float * ALPHA,
   const float * A, const int LDA, float * B, const int LDB
)
{
   const int a_step = 2 * LDA, b_step = 2 * LDB;
   register float rhs_i, rhs_r;
   int a_pos, b_col, b_dst, b_src, col, p, row;

   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;
/*
 * Bottom-up sweep: the entries B(k,j), k > row, used below are the ones
 * already finalised by earlier iterations.
 */
      for( row = M - 1; row >= 0; row-- )
      {
         b_dst = b_col + 2 * row;
         Mmul( ALPHA[0], ALPHA[1], B[b_dst], B[b_dst+1], rhs_r, rhs_i );

         a_pos = row * a_step + 2 * ( row + 1 );
         b_src = b_col        + 2 * ( row + 1 );
         for( p = row + 1; p < M; p++ )
         {
            Mmls( A[a_pos], A[a_pos+1], B[b_src], B[b_src+1], rhs_r, rhs_i );
            a_pos += 2;
            b_src += 2;
         }
         Mset( rhs_r, rhs_i, B[b_dst], B[b_dst+1] );
      }
   }
}
/*
 * ATL_zreftrmmLLNU -- ATL_zreftrmm kernel for the case
 * ( AtlasLeft, AtlasLower, AtlasNoTrans, AtlasUnit ).
 *
 * A and B are indexed as interleaved (real, imaginary) double pairs in
 * column-major order (2*LDA / 2*LDB doubles per column).  For every
 * column of B and every row k, from the last one up to the first,
 * B(k,j) is combined with ALPHA and stored back, then that value
 * times A(i,k) is added to each B(i,j) with i > k.  The diagonal of A
 * is never read.
 *
 * NOTE(review): Mmul, Mset and Mmla are macros defined outside this
 * view; complex multiply, copy and multiply-accumulate are assumed.
 */
void ATL_zreftrmmLLNU
(
   const int M, const int N, const double * ALPHA,
   const double * A, const int LDA, double * B, const int LDB
)
{
   const int a_step = 2 * LDA, b_step = 2 * LDB;
   double scaled_i, scaled_r;
   int a_pos, b_col, b_dst, b_piv, col, piv, row;

   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;

      for( piv = M - 1; piv >= 0; piv-- )
      {
         b_piv = b_col + 2 * piv;
         Mmul( ALPHA[0], ALPHA[1], B[b_piv], B[b_piv+1], scaled_r, scaled_i );
         Mset( scaled_r, scaled_i, B[b_piv], B[b_piv+1] );

         /* Strictly-lower part of column piv of A updates rows below. */
         a_pos = piv * a_step + 2 * ( piv + 1 );
         b_dst = b_col        + 2 * ( piv + 1 );
         for( row = piv + 1; row < M; row++ )
         {
            Mmla( scaled_r, scaled_i, A[a_pos], A[a_pos+1], B[b_dst], B[b_dst+1] );
            a_pos += 2;
            b_dst += 2;
         }
      }
   }
}
/*
 * ATL_crefgpmvLC -- ATL_crefgpmv kernel for ( AtlasLower, AtlasConj ).
 *
 * Y (M entries, increment INCY) is first passed to Mcvscal together
 * with BETA.  Then, for each of the N columns, ALPHA * x(j) is formed
 * and the conjugated column entries of A times that value are added to
 * Y.  A, X and Y hold interleaved (real, imaginary) float pairs.
 *
 * The distance between consecutive columns of A is not constant: it
 * starts at 2*LDA floats and is reduced by 2 floats before each advance.
 *
 * NOTE(review): Mcvscal, Mmul and Mmla are macros defined outside this
 * view; vector scale, complex multiply and multiply-accumulate are
 * assumed.
 */
void ATL_crefgpmvLC
(
   const int M, const int N, const float * ALPHA,
   const float * A, const int LDA, const float * X, const int INCX,
   const float * BETA, float * Y, const int INCY
)
{
   register float ax_i, ax_r;
   const int x_step = 2 * INCX, y_step = 2 * INCY;
   int a_col = 0, a_pos, a_stride = 2 * LDA, col, row, x_pos = 0, y_pos;

   Mcvscal( M, BETA, Y, INCY );

   for( col = 0; col < N; col++ )
   {
      Mmul( ALPHA[0], ALPHA[1], X[x_pos], X[x_pos+1], ax_r, ax_i );

      a_pos = a_col;
      y_pos = 0;
      for( row = 0; row < M; row++ )
      {
         Mmla( A[a_pos], -A[a_pos+1], ax_r, ax_i, Y[y_pos], Y[y_pos+1] );
         a_pos += 2;
         y_pos += y_step;
      }

      /* Shrink the column stride first, then step to the next column. */
      a_stride -= 2;
      a_col    += a_stride;
      x_pos    += x_step;
   }
}
/*
 * ATL_crefsyrkLN -- ATL_crefsyrk kernel for ( AtlasLower, AtlasNoTrans ).
 *
 * Only rows j..N-1 of column j of C are touched.  That part of the
 * column is first passed to Mcvscal with BETA; then, for each of the K
 * columns l of A, ALPHA * A(j,l) is formed and multiplied into
 * A(i,l), i >= j, the products being added to C(i,j).  A and C hold
 * interleaved (real, imaginary) float pairs in column-major order.
 *
 * NOTE(review): Mcvscal, Mmul and Mmla are macros defined outside this
 * view; vector scale, complex multiply and multiply-accumulate are
 * assumed.
 */
void ATL_crefsyrkLN
(
   const int N, const int K, const float * ALPHA,
   const float * A, const int LDA, const float * BETA,
   float * C, const int LDC
)
{
   register float w_i, w_r;
   const int a_step = 2 * LDA, c_step = 2 * LDC;
   int a_piv, a_pos, c_diag, c_pos, col, p, row, tail;
   float * c_tail;

   for( col = 0; col < N; col++ )
   {
      c_diag = col * c_step + 2 * col;      /* offset of C(col,col)   */
      tail   = N - col;                     /* entries from diag down */
      c_tail = C + c_diag;
      Mcvscal( tail, BETA, c_tail, 1 );

      for( p = 0; p < K; p++ )
      {
         a_piv = p * a_step + 2 * col;      /* offset of A(col,p)     */
         Mmul( ALPHA[0], ALPHA[1], A[a_piv], A[a_piv+1], w_r, w_i );

         a_pos = a_piv;
         c_pos = c_diag;
         for( row = col; row < N; row++ )
         {
            Mmla( w_r, w_i, A[a_pos], A[a_pos+1], C[c_pos], C[c_pos+1] );
            a_pos += 2;
            c_pos += 2;
         }
      }
   }
}
/*
 * ATL_creftrsmLUTN -- ATL_creftrsm kernel for the case
 * ( AtlasLeft, AtlasUpper, AtlasTrans, AtlasNonUnit ).
 *
 * A and B are indexed as interleaved (real, imaginary) float pairs in
 * column-major order (2*LDA / 2*LDB floats per column).  For every
 * column of B, rows are processed top-down: B(i,j) is combined with
 * ALPHA, the products A(k,i) * B(k,j) for k < i are removed from it,
 * the result is passed to Msdiv together with the diagonal entry
 * A(i,i), and then stored back.
 *
 * NOTE(review): Mmul, Mmls, Msdiv and Mset are macros defined outside
 * this view; complex multiply, multiply-subtract, in-place complex
 * division and copy are assumed.
 */
void ATL_creftrsmLUTN
(
   const int M, const int N, const float * ALPHA,
   const float * A, const int LDA, float * B, const int LDB
)
{
   const int a_step = 2 * LDA, b_step = 2 * LDB;
   register float rhs_i, rhs_r;
   int a_col, a_diag, a_pos, b_col, b_dst, b_src, col, p, row;

   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;

      for( row = 0; row < M; row++ )
      {
         a_col = row * a_step;
         b_dst = b_col + 2 * row;

         Mmul( ALPHA[0], ALPHA[1], B[b_dst], B[b_dst+1], rhs_r, rhs_i );

         /* Rows above the diagonal hold already-finalised values. */
         a_pos = a_col;
         b_src = b_col;
         for( p = 0; p < row; p++ )
         {
            Mmls( A[a_pos], A[a_pos+1], B[b_src], B[b_src+1], rhs_r, rhs_i );
            a_pos += 2;
            b_src += 2;
         }

         a_diag = a_col + 2 * row;
         Msdiv( A[a_diag], A[a_diag+1], rhs_r, rhs_i );
         Mset( rhs_r, rhs_i, B[b_dst], B[b_dst+1] );
      }
   }
}
/*
 * ATL_zreftrmmLLCU -- ATL_zreftrmm kernel for the case
 * ( AtlasLeft, AtlasLower, AtlasConjTrans, AtlasUnit ).
 *
 * A and B are indexed as interleaved (real, imaginary) double pairs in
 * column-major order (2*LDA / 2*LDB doubles per column).  For every
 * column of B, rows are processed top-down: starting from B(i,j), the
 * conjugated entries A(k,i), k > i, paired with B(k,j) are accumulated,
 * and the total is combined with ALPHA and stored in B(i,j).  The
 * diagonal of A is never read.
 *
 * NOTE(review): Mset, Mmla and Mmul are macros defined outside this
 * view; copy, complex multiply-accumulate and multiply are assumed.
 */
void ATL_zreftrmmLLCU
(
   const int M, const int N, const double * ALPHA,
   const double * A, const int LDA, double * B, const int LDB
)
{
   const int a_step = 2 * LDA, b_step = 2 * LDB;
   double sum_i, sum_r;
   int a_pos, b_col, b_dst, b_src, col, p, row;

   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;
/*
 * Top-down sweep: the rows below the current one, read by the inner
 * loop, still hold their input values.
 */
      for( row = 0; row < M; row++ )
      {
         b_dst = b_col + 2 * row;
         Mset( B[b_dst], B[b_dst+1], sum_r, sum_i );

         a_pos = row * a_step + 2 * ( row + 1 );
         b_src = b_col        + 2 * ( row + 1 );
         for( p = row + 1; p < M; p++ )
         {
            Mmla( A[a_pos], -A[a_pos+1], B[b_src], B[b_src+1], sum_r, sum_i );
            a_pos += 2;
            b_src += 2;
         }
         Mmul( ALPHA[0], ALPHA[1], sum_r, sum_i, B[b_dst], B[b_dst+1] );
      }
   }
}
/*
 * ATL_zrefsyrkUN -- ATL_zrefsyrk kernel for ( AtlasUpper, AtlasNoTrans ).
 *
 * Only rows 0..j of column j of C are touched.  That part of the column
 * is first passed to Mzvscal with BETA; then, for each of the K columns
 * l of A, ALPHA * A(j,l) is formed and multiplied into A(i,l), i <= j,
 * the products being added to C(i,j).  A and C hold interleaved
 * (real, imaginary) double pairs in column-major order.
 *
 * NOTE(review): Mzvscal, Mmul and Mmla are macros defined outside this
 * view; vector scale, complex multiply and multiply-accumulate are
 * assumed.
 */
void ATL_zrefsyrkUN
(
   const int N, const int K, const double * ALPHA,
   const double * A, const int LDA, const double * BETA,
   double * C, const int LDC
)
{
   register double w_i, w_r;
   const int a_step = 2 * LDA, c_step = 2 * LDC;
   int a_col, a_piv, a_pos, c_col, c_pos, col, head, p, row;
   double * c_head;

   for( col = 0; col < N; col++ )
   {
      c_col  = col * c_step;
      head   = col + 1;                     /* entries down to the diag */
      c_head = C + c_col;
      Mzvscal( head, BETA, c_head, 1 );

      for( p = 0; p < K; p++ )
      {
         a_col = p * a_step;
         a_piv = a_col + 2 * col;           /* offset of A(col,p)       */
         Mmul( ALPHA[0], ALPHA[1], A[a_piv], A[a_piv+1], w_r, w_i );

         a_pos = a_col;
         c_pos = c_col;
         for( row = 0; row <= col; row++ )
         {
            Mmla( w_r, w_i, A[a_pos], A[a_pos+1], C[c_pos], C[c_pos+1] );
            a_pos += 2;
            c_pos += 2;
         }
      }
   }
}
/*
 * ATL_creftbmvUNN -- ATL_creftbmv kernel for the case
 * ( AtlasUpper, AtlasNoTrans, AtlasNonUnit ).
 *
 * X is updated in place, column by column of A.  For column j the old
 * x(j) is saved, then A(i,j) * x(j) is added to x(i) for the rows
 * i = max(0, j-K) .. j-1, and finally x(j) is replaced by the diagonal
 * entry times the saved value.  Within column j of the array A, row i
 * is stored at position K - j + i, so the diagonal sits at position K.
 * A and X hold interleaved (real, imaginary) float pairs.
 *
 * NOTE(review): Mset, Mmla and Mmul are macros defined outside this
 * view; copy, complex multiply-accumulate and multiply are assumed.
 */
void ATL_creftbmvUNN
(
   const int N, const int K, const float * A, const int LDA,
   float * X, const int INCX
)
{
   register float xj_i, xj_r;
   const int a_step = 2 * LDA, x_step = 2 * INCX;
   int a_col, a_pos, col, first, row, x_col, x_first = 0, x_pos;

   for( col = 0; col < N; col++ )
   {
      a_col = col * a_step;
      x_col = col * x_step;

      Mset( X[x_col], X[x_col+1], xj_r, xj_i );

      first = ( col - K > 0 ) ? col - K : 0;     /* first row in band  */
      a_pos = a_col + 2 * ( ( K - col ) + first );
      x_pos = x_first;
      for( row = first; row < col; row++ )
      {
         Mmla( A[a_pos], A[a_pos+1], xj_r, xj_i, X[x_pos], X[x_pos+1] );
         a_pos += 2;
         x_pos += x_step;
      }

      /* The running offset a_pos now addresses the diagonal entry. */
      Mmul( A[a_pos], A[a_pos+1], xj_r, xj_i, X[x_col], X[x_col+1] );

      /* Once the band no longer reaches row 0, slide the X window. */
      if( col >= K )
      {
         x_first += x_step;
      }
   }
}
/*
 * ATL_creftbmvLTN -- ATL_creftbmv kernel for the case
 * ( AtlasLower, AtlasTrans, AtlasNonUnit ).
 *
 * X is updated in place.  For each j, the product of the diagonal entry
 * (first entry of column j of the array A) with x(j) is formed, the
 * products A(i,j) * x(i) for i = j+1 .. min(N-1, j+K) are accumulated on
 * top, and the total is stored in x(j).  A and X hold interleaved
 * (real, imaginary) float pairs; columns of A are 2*LDA floats apart.
 *
 * NOTE(review): Mmul, Mmla and Mset are macros defined outside this
 * view; complex multiply, multiply-accumulate and copy are assumed.
 */
void ATL_creftbmvLTN
(
   const int N, const int K, const float * A, const int LDA,
   float * X, const int INCX
)
{
   register float dot_i, dot_r;
   const int a_step = 2 * LDA, x_step = 2 * INCX;
   int a_col, a_pos, col, last, row, x_col, x_pos;

   for( col = 0; col < N; col++ )
   {
      a_col = col * a_step;
      x_col = col * x_step;

      Mmul( A[a_col], A[a_col+1], X[x_col], X[x_col+1], dot_r, dot_i );

      last  = ( N - 1 > col + K ) ? col + K : N - 1;   /* last row in band */
      a_pos = a_col + 2;
      x_pos = x_col + x_step;
      for( row = col + 1; row <= last; row++ )
      {
         Mmla( A[a_pos], A[a_pos+1], X[x_pos], X[x_pos+1], dot_r, dot_i );
         a_pos += 2;
         x_pos += x_step;
      }
      Mset( dot_r, dot_i, X[x_col], X[x_col+1] );
   }
}
/*
 * ATL_zrefgemvN -- ATL_zrefgemv kernel for AtlasNoTrans.
 *
 * Y (M entries, increment INCY) is first passed to Mzvscal together
 * with BETA.  Then, for each of the N columns of A, ALPHA * x(j) is
 * formed and the column of A times that value is added to Y.  A, X and
 * Y hold interleaved (real, imaginary) double pairs; columns of A are
 * 2*LDA doubles apart.
 *
 * NOTE(review): Mzvscal, Mmul and Mmla are macros defined outside this
 * view; vector scale, complex multiply and multiply-accumulate are
 * assumed.
 */
void ATL_zrefgemvN
(
   const int M, const int N, const double * ALPHA,
   const double * A, const int LDA, const double * X, const int INCX,
   const double * BETA, double * Y, const int INCY
)
{
   register double ax_i, ax_r;
   const int a_step = 2 * LDA, x_step = 2 * INCX, y_step = 2 * INCY;
   int a_pos, col, row, x_pos, y_pos;

   Mzvscal( M, BETA, Y, INCY );

   for( col = 0; col < N; col++ )
   {
      x_pos = col * x_step;
      Mmul( ALPHA[0], ALPHA[1], X[x_pos], X[x_pos+1], ax_r, ax_i );

      a_pos = col * a_step;
      y_pos = 0;
      for( row = 0; row < M; row++ )
      {
         Mmla( A[a_pos], A[a_pos+1], ax_r, ax_i, Y[y_pos], Y[y_pos+1] );
         a_pos += 2;
         y_pos += y_step;
      }
   }
}
/*
 * ATL_creftrmvLHN -- ATL_creftrmv kernel for the case
 * ( AtlasLower, AtlasConjTrans, AtlasNonUnit ).
 *
 * X is updated in place.  For each j, the conjugated diagonal entry
 * A(j,j) times x(j) is formed, the conjugated entries A(i,j), i > j,
 * times x(i) are accumulated on top, and the total is stored in x(j).
 * A and X hold interleaved (real, imaginary) float pairs; successive
 * diagonal entries of A are 2*(LDA+1) floats apart.
 *
 * NOTE(review): Mmul, Mmla and Mset are macros defined outside this
 * view; complex multiply, multiply-accumulate and copy are assumed.
 */
void ATL_creftrmvLHN
(
   const int N, const float * A, const int LDA,
   float * X, const int INCX
)
{
   register float dot_i, dot_r;
   const int diag_step = 2 * ( LDA + 1 ), x_step = 2 * INCX;
   int a_diag, a_pos, col, row, x_col, x_pos;

   for( col = 0; col < N; col++ )
   {
      a_diag = col * diag_step;
      x_col  = col * x_step;

      Mmul( A[a_diag], -A[a_diag+1], X[x_col], X[x_col+1], dot_r, dot_i );

      /* Entries x(i), i > col, are still the input values here. */
      a_pos = a_diag + 2;
      x_pos = x_col + x_step;
      for( row = col + 1; row < N; row++ )
      {
         Mmla( A[a_pos], -A[a_pos+1], X[x_pos], X[x_pos+1], dot_r, dot_i );
         a_pos += 2;
         x_pos += x_step;
      }
      Mset( dot_r, dot_i, X[x_col], X[x_col+1] );
   }
}
/*
 * ATL_zreftpmvUCN -- ATL_zreftpmv kernel for the case
 * ( AtlasUpper, AtlasConj, AtlasNonUnit ).
 *
 * X is updated in place, column by column of A.  For column j the old
 * x(j) is saved, the conjugated entries A(i,j), i < j, times that value
 * are added to x(i), and x(j) is replaced by the conjugated diagonal
 * entry times the saved value.  A and X hold interleaved
 * (real, imaginary) double pairs.
 *
 * The distance between consecutive columns of A is not constant: it
 * starts at 2*LDA doubles and grows by 2 doubles after each advance.
 *
 * NOTE(review): Mset, Mmla and Mmul are macros defined outside this
 * view; copy, complex multiply-accumulate and multiply are assumed.
 */
void ATL_zreftpmvUCN
(
   const int N, const double * A, const int LDA,
   double * X, const int INCX
)
{
   register double xj_i, xj_r;
   const int x_step = 2 * INCX;
   int a_col = 0, a_pos, a_stride = 2 * LDA, col, row, x_col = 0, x_pos;

   for( col = 0; col < N; col++ )
   {
      Mset( X[x_col], X[x_col+1], xj_r, xj_i );

      a_pos = a_col;
      x_pos = 0;
      for( row = 0; row < col; row++ )
      {
         Mmla( A[a_pos], -A[a_pos+1], xj_r, xj_i, X[x_pos], X[x_pos+1] );
         a_pos += 2;
         x_pos += x_step;
      }

      /* The running offset a_pos now addresses the diagonal entry. */
      Mmul( A[a_pos], -A[a_pos+1], xj_r, xj_i, X[x_col], X[x_col+1] );

      /* Step to the next column first, then widen the column stride. */
      a_col    += a_stride;
      a_stride += 2;
      x_col    += x_step;
   }
}
/*
 * ATL_zrefgemmNN -- reference matrix-multiply kernel operating on
 * untransposed A and B (presumably the ( AtlasNoTrans, AtlasNoTrans )
 * case of ATL_zrefgemm, judging by the name -- confirm).
 *
 * For every column j of C: the M-entry column is passed to Mzgescal
 * with BETA; then, for each l < K, ALPHA * B(l,j) is formed and column
 * l of A times that value is added to the column of C.  A, B and C hold
 * interleaved (real, imaginary) double pairs in column-major order with
 * 2*LDA, 2*LDB and 2*LDC doubles per column.
 *
 * NOTE(review): Mzgescal, Mmul and Mmla are macros defined outside this
 * view; matrix scale, complex multiply and multiply-accumulate are
 * assumed.
 */
void ATL_zrefgemmNN
(
   const int M, const int N, const int K, const double * ALPHA,
   const double * A, const int LDA, const double * B, const int LDB,
   const double * BETA, double * C, const int LDC
)
{
   register double w_i, w_r;
   const int a_step = 2 * LDA, b_step = 2 * LDB, c_step = 2 * LDC;
   int a_pos, b_pos, c_col, c_pos, col, p, row;
   double * c_head;

   for( col = 0; col < N; col++ )
   {
      c_col  = col * c_step;
      c_head = C + c_col;
      Mzgescal( M, 1, BETA, c_head, LDC );

      b_pos = col * b_step;
      for( p = 0; p < K; p++ )
      {
         Mmul( ALPHA[0], ALPHA[1], B[b_pos], B[b_pos+1], w_r, w_i );

         a_pos = p * a_step;
         c_pos = c_col;
         for( row = 0; row < M; row++ )
         {
            Mmla( A[a_pos], A[a_pos+1], w_r, w_i, C[c_pos], C[c_pos+1] );
            a_pos += 2;
            c_pos += 2;
         }
         b_pos += 2;
      }
   }
}
/*
 * ATL_zrefhbmvU -- ATL_zrefhbmv kernel for AtlasUpper.
 *
 * Y (N entries, increment INCY) is first passed to Mzvscal with BETA.
 * Then, for each column j of A:
 *   - ALPHA * x(j) is formed;
 *   - for the rows i = max(0, j-K) .. j-1, A(i,j) times that value is
 *     added to y(i), while conj( A(i,j) ) * x(i) is accumulated in a
 *     separate sum;
 *   - y(j) receives the real part of the diagonal entry times
 *     ALPHA * x(j) (the imaginary part of the diagonal is not read),
 *     plus ALPHA times the accumulated sum.
 * Within column j of the array A, row i is stored at position
 * K - j + i.  A, X and Y hold interleaved (real, imaginary) double
 * pairs.
 *
 * NOTE(review): Mzvscal, Mmul, Mmla and Mset are macros defined outside
 * this view; vector scale, complex multiply, multiply-accumulate and
 * copy are assumed.
 */
void ATL_zrefhbmvU
(
   const int N, const int K, const double * ALPHA,
   const double * A, const int LDA, const double * X, const int INCX,
   const double * BETA, double * Y, const int INCY
)
{
   register double ax_i, ax_r, dot_i, dot_r;
   const int a_step = 2 * LDA, x_step = 2 * INCX, y_step = 2 * INCY;
   int a_col, a_pos, col, first, row,
       x_col, x_first = 0, x_pos, y_col, y_first = 0, y_pos;

   Mzvscal( N, BETA, Y, INCY );

   for( col = 0; col < N; col++ )
   {
      a_col = col * a_step;
      x_col = col * x_step;
      y_col = col * y_step;

      Mmul( ALPHA[0], ALPHA[1], X[x_col], X[x_col+1], ax_r, ax_i );
      Mset( ATL_dZERO, ATL_dZERO, dot_r, dot_i );

      first = ( col - K > 0 ) ? col - K : 0;     /* first row in band  */
      a_pos = a_col + 2 * ( ( K - col ) + first );
      x_pos = x_first;
      y_pos = y_first;
      for( row = first; row < col; row++ )
      {
         Mmla( A[a_pos], A[a_pos+1], ax_r, ax_i, Y[y_pos], Y[y_pos+1] );
         Mmla( A[a_pos], -A[a_pos+1], X[x_pos], X[x_pos+1], dot_r, dot_i );
         a_pos += 2;
         x_pos += x_step;
         y_pos += y_step;
      }

      /* a_pos now addresses the diagonal; only its real part is used. */
      Mset( Y[y_col] + A[a_pos]*ax_r, Y[y_col+1] + A[a_pos]*ax_i,
            Y[y_col], Y[y_col+1] );
      Mmla( ALPHA[0], ALPHA[1], dot_r, dot_i, Y[y_col], Y[y_col+1] );

      /* Once the band no longer reaches row 0, slide both windows. */
      if( col >= K )
      {
         x_first += x_step;
         y_first += y_step;
      }
   }
}
/*
 * ATL_zrefher2kLN -- ATL_zrefher2k kernel for
 * ( AtlasLower, AtlasNoTrans ).  BETA is a real scalar.
 *
 * Only rows j..N-1 of column j of C are touched.  For each column j:
 *   - the real part of C(j,j) is passed to Mdelscal with BETA and its
 *     imaginary part is set to ATL_dZERO;
 *   - the 2*(N-j-1) doubles below the diagonal are passed to Mdvscal
 *     with BETA;
 *   - for each l < K, wb = ALPHA * conj( B(j,l) ) and
 *     wa = conj( ALPHA ) * conj( A(j,l) ) are formed; the diagonal
 *     receives the real part of A(j,l)*wb + B(j,l)*wa (imaginary part
 *     forced to ATL_dZERO), and every C(i,j), i > j, receives
 *     A(i,l)*wb + B(i,l)*wa.
 * A, B and C hold interleaved (real, imaginary) double pairs in
 * column-major order.
 *
 * NOTE(review): Mdelscal, Mdvscal, Mmul, Mmla and Mset are macros
 * defined outside this view; real scalar/vector scale, complex
 * multiply, multiply-accumulate and copy are assumed.
 */
void ATL_zrefher2kLN
(
   const int N, const int K, const double * ALPHA,
   const double * A, const int LDA, const double * B, const int LDB,
   const double BETA, double * C, const int LDC
)
{
   double wa_i, wa_r, wb_i, wb_r;
   const int a_step = 2 * LDA, b_step = 2 * LDB, c_step = 2 * LDC;
   int a_pos, b_pos, below, c_diag, c_pos, col, p, row;
   double * c_below;

   for( col = 0; col < N; col++ )
   {
      c_diag = col * c_step + 2 * col;           /* offset of C(col,col) */

      Mdelscal( BETA, C[c_diag] );
      C[c_diag+1] = ATL_dZERO;

      below   = 2 * ( N - col - 1 );             /* doubles under diag   */
      c_below = C + c_diag + 2;
      Mdvscal( below, BETA, c_below, 1 );

      for( p = 0; p < K; p++ )
      {
         a_pos = p * a_step + 2 * col;           /* offset of A(col,p)   */
         b_pos = p * b_step + 2 * col;           /* offset of B(col,p)   */

         Mmul( ALPHA[0],  ALPHA[1], B[b_pos], -B[b_pos+1], wb_r, wb_i );
         Mmul( ALPHA[0], -ALPHA[1], A[a_pos], -A[a_pos+1], wa_r, wa_i );

         /* Diagonal: real part only, imaginary part forced to zero. */
         c_pos = c_diag;
         Mset( C[c_pos] + A[a_pos] * wb_r - A[a_pos+1] * wb_i + B[b_pos] * wa_r - B[b_pos+1] * wa_i,
               ATL_dZERO, C[c_pos], C[c_pos+1] );

         for( row = col + 1; row < N; row++ )
         {
            a_pos += 2;
            b_pos += 2;
            c_pos += 2;
            Mmla( A[a_pos], A[a_pos+1], wb_r, wb_i, C[c_pos], C[c_pos+1] );
            Mmla( B[b_pos], B[b_pos+1], wa_r, wa_i, C[c_pos], C[c_pos+1] );
         }
      }
   }
}
/*
 * ATL_crefhemmRL -- ATL_crefhemm kernel for ( AtlasRight, AtlasLower ).
 *
 * For each column j of C (M rows):
 *   - ALPHA times the real part of A(j,j) is formed (the imaginary part
 *     of the diagonal is not read); every C(i,j) is passed to Mcelscal
 *     with BETA and then receives that value times B(i,j);
 *   - for k < j, ALPHA * conj( A(j,k) ) times column k of B is added;
 *   - for k > j, ALPHA * A(k,j) times column k of B is added.
 * Only the lower triangle of A is referenced.  A, B and C hold
 * interleaved (real, imaginary) float pairs in column-major order.
 *
 * NOTE(review): Mset, Mcelscal, Mmul and Mmla are macros defined
 * outside this view; copy, complex element scale, multiply and
 * multiply-accumulate are assumed.
 */
void ATL_crefhemmRL
(
   const int M, const int N, const float * ALPHA,
   const float * A, const int LDA, const float * B, const int LDB,
   const float * BETA, float * C, const int LDC
)
{
   register float w_i, w_r;
   const int a_step = 2 * LDA, b_step = 2 * LDB, c_step = 2 * LDC;
   int a_col, a_pos, b_pos, c_col, c_pos, col, other, row;

   for( col = 0; col < N; col++ )
   {
      a_col = col * a_step;
      c_col = col * c_step;

      /* Diagonal term, combined with the BETA scaling of the column. */
      a_pos = a_col + 2 * col;
      Mset( ALPHA[0] * A[a_pos], ALPHA[1] * A[a_pos], w_r, w_i );

      b_pos = col * b_step;
      c_pos = c_col;
      for( row = 0; row < M; row++ )
      {
         Mcelscal( BETA[0], BETA[1], C[c_pos], C[c_pos+1] );
         Mmla( w_r, w_i, B[b_pos], B[b_pos+1], C[c_pos], C[c_pos+1] );
         b_pos += 2;
         c_pos += 2;
      }

      /* Columns left of the diagonal: conjugate of stored A(col,other). */
      for( other = 0; other < col; other++ )
      {
         a_pos = other * a_step + 2 * col;
         Mmul( ALPHA[0], ALPHA[1], A[a_pos], -A[a_pos+1], w_r, w_i );

         b_pos = other * b_step;
         c_pos = c_col;
         for( row = 0; row < M; row++ )
         {
            Mmla( w_r, w_i, B[b_pos], B[b_pos+1], C[c_pos], C[c_pos+1] );
            b_pos += 2;
            c_pos += 2;
         }
      }

      /* Columns right of the diagonal: stored A(other,col) as is. */
      for( other = col + 1; other < N; other++ )
      {
         a_pos = a_col + 2 * other;
         Mmul( ALPHA[0], ALPHA[1], A[a_pos], A[a_pos+1], w_r, w_i );

         b_pos = other * b_step;
         c_pos = c_col;
         for( row = 0; row < M; row++ )
         {
            Mmla( w_r, w_i, B[b_pos], B[b_pos+1], C[c_pos], C[c_pos+1] );
            b_pos += 2;
            c_pos += 2;
         }
      }
   }
}
/*
 * ATL_crefhpmvU -- ATL_crefhpmv kernel for AtlasUpper.
 *
 * Y (N entries, increment INCY) is first passed to Mcvscal with BETA.
 * Then, for each column j of A:
 *   - ALPHA * x(j) is formed;
 *   - for the rows i < j, A(i,j) times that value is added to y(i),
 *     while conj( A(i,j) ) * x(i) is accumulated in a separate sum;
 *   - y(j) receives the real part of the diagonal entry times
 *     ALPHA * x(j) (the imaginary part of the diagonal is not read),
 *     plus ALPHA times the accumulated sum.
 * A, X and Y hold interleaved (real, imaginary) float pairs.
 *
 * The distance between consecutive columns of A is not constant: it
 * starts at 2*LDA floats and grows by 2 floats after each advance.
 *
 * NOTE(review): Mcvscal, Mmul, Mmla and Mset are macros defined outside
 * this view; vector scale, complex multiply, multiply-accumulate and
 * copy are assumed.
 */
void ATL_crefhpmvU
(
   const int N, const float * ALPHA, const float * A, const int LDA,
   const float * X, const int INCX, const float * BETA,
   float * Y, const int INCY
)
{
   register float ax_i, ax_r, dot_i, dot_r;
   const int x_step = 2 * INCX, y_step = 2 * INCY;
   int a_col = 0, a_pos, a_stride = 2 * LDA, col, row,
       x_col = 0, x_pos, y_col = 0, y_pos;

   Mcvscal( N, BETA, Y, INCY );

   for( col = 0; col < N; col++ )
   {
      Mmul( ALPHA[0], ALPHA[1], X[x_col], X[x_col+1], ax_r, ax_i );
      Mset( ATL_sZERO, ATL_sZERO, dot_r, dot_i );

      a_pos = a_col;
      x_pos = 0;
      y_pos = 0;
      for( row = 0; row < col; row++ )
      {
         Mmla( A[a_pos], A[a_pos+1], ax_r, ax_i, Y[y_pos], Y[y_pos+1] );
         Mmla( A[a_pos], -A[a_pos+1], X[x_pos], X[x_pos+1], dot_r, dot_i );
         a_pos += 2;
         x_pos += x_step;
         y_pos += y_step;
      }

      /* a_pos now addresses the diagonal; only its real part is used. */
      Mset( Y[y_col] + A[a_pos]*ax_r, Y[y_col+1] + A[a_pos]*ax_i,
            Y[y_col], Y[y_col+1] );
      Mmla( ALPHA[0], ALPHA[1], dot_r, dot_i, Y[y_col], Y[y_col+1] );

      /* Step to the next column first, then widen the column stride. */
      a_col    += a_stride;
      a_stride += 2;
      x_col    += x_step;
      y_col    += y_step;
   }
}
/*
 * ATL_zrefsymmLU -- ATL_zrefsymm kernel for ( AtlasLeft, AtlasUpper ).
 *
 * For every column j of C and every row i, top-down:
 *   - ALPHA * B(i,j) is formed;
 *   - for k < i, A(k,i) times that value is added to C(k,j), while
 *     B(k,j) * A(k,i) is accumulated in a separate sum;
 *   - C(i,j) is passed to Mzelscal with BETA, then receives
 *     ALPHA * B(i,j) times the diagonal entry A(i,i), plus ALPHA times
 *     the accumulated sum.
 * Only the upper triangle of A is referenced.  A, B and C hold
 * interleaved (real, imaginary) double pairs in column-major order.
 *
 * NOTE(review): Mmul, Mset, Mmla and Mzelscal are macros defined
 * outside this view; complex multiply, copy, multiply-accumulate and
 * element scale are assumed.
 */
void ATL_zrefsymmLU
(
   const int M, const int N, const double * ALPHA,
   const double * A, const int LDA, const double * B, const int LDB,
   const double * BETA, double * C, const int LDC
)
{
   register double ab_i, ab_r, dot_i, dot_r;
   const int a_step = 2 * LDA, b_step = 2 * LDB, c_step = 2 * LDC;
   int a_col, a_pos, b_col, b_dst, b_pos, c_col, c_dst, c_pos,
       col, p, row;

   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;
      c_col = col * c_step;

      for( row = 0; row < M; row++ )
      {
         a_col = row * a_step;
         b_dst = b_col + 2 * row;
         c_dst = c_col + 2 * row;

         Mmul( ALPHA[0], ALPHA[1], B[b_dst], B[b_dst+1], ab_r, ab_i );
         Mset( ATL_dZERO, ATL_dZERO, dot_r, dot_i );

         /* Rows above: they were already BETA-scaled in earlier passes. */
         a_pos = a_col;
         b_pos = b_col;
         c_pos = c_col;
         for( p = 0; p < row; p++ )
         {
            Mmla( A[a_pos], A[a_pos+1], ab_r, ab_i, C[c_pos], C[c_pos+1] );
            Mmla( B[b_pos], B[b_pos+1], A[a_pos], A[a_pos+1], dot_r, dot_i );
            a_pos += 2;
            b_pos += 2;
            c_pos += 2;
         }

         Mzelscal( BETA[0], BETA[1], C[c_dst], C[c_dst+1] );

         a_pos = a_col + 2 * row;               /* diagonal A(row,row) */
         Mmla( ab_r, ab_i, A[a_pos], A[a_pos+1], C[c_dst], C[c_dst+1] );
         Mmla( ALPHA[0], ALPHA[1], dot_r, dot_i, C[c_dst], C[c_dst+1] );
      }
   }
}
/*
 * Purpose
 * =======
 *
 * ATL_crefgerc performs the rank 1 operation
 *
 *    A := alpha * x * conjg( y' ) + A,
 *
 * where alpha is a scalar, x is an m-element vector, y is an n-element
 * vector and A is an m by n matrix.
 *
 * Arguments
 * =========
 *
 * M      (input) number of rows of A; must be at least zero.
 * N      (input) number of columns of A; must be at least zero.
 * ALPHA  (input) the scalar alpha, as a (real, imaginary) float pair.
 *        When alpha is zero, X and Y need not be set on input.
 * X      (input) first accessed entry of an incremented array of at
 *        least ( 1 + ( m - 1 ) * abs( INCX ) ) * sizeof( float [2] )
 *        bytes holding the vector x.
 * INCX   (input) increment between elements of X; must not be zero.
 * Y      (input) first accessed entry of an incremented array of at
 *        least ( 1 + ( n - 1 ) * abs( INCY ) ) * sizeof( float [2] )
 *        bytes holding the vector y.
 * INCY   (input) increment between elements of Y; must not be zero.
 * A      (input/output) array of at least
 *        LDA * n * sizeof( float [2] ) bytes.  On entry its leading
 *        m by n part holds the matrix coefficients; on exit it holds
 *        the updated matrix.
 * LDA    (input) first dimension of A as declared by the caller; must
 *        be at least max( 1, m ).
 *
 * All input arguments are unchanged on exit.
 *
 * NOTE(review): Mszero, Mmul and Mmla are macros defined outside this
 * view; complex zero test, multiply and multiply-accumulate are assumed.
 */
void ATL_crefgerc
(
   const int M, const int N, const float * ALPHA,
   const float * X, const int INCX, const float * Y, const int INCY,
   float * A, const int LDA
)
{
   register float ay_i, ay_r;
   const int a_step = 2 * LDA, x_step = 2 * INCX, y_step = 2 * INCY;
   int a_pos, col, row, x_pos, y_pos;

   /* Nothing to do for an empty matrix or a zero alpha. */
   if( ( M == 0 ) || ( N == 0 ) )
   {
      return;
   }
   if( Mszero( ALPHA[0], ALPHA[1] ) )
   {
      return;
   }

   for( col = 0; col < N; col++ )
   {
      y_pos = col * y_step;
      Mmul( ALPHA[0], ALPHA[1], Y[y_pos], -Y[y_pos+1], ay_r, ay_i );

      a_pos = col * a_step;
      x_pos = 0;
      for( row = 0; row < M; row++ )
      {
         Mmla( X[x_pos], X[x_pos+1], ay_r, ay_i, A[a_pos], A[a_pos+1] );
         a_pos += 2;
         x_pos += x_step;
      }
   }
}
/*
 * ATL_crefsymmLL -- ATL_crefsymm kernel for ( AtlasLeft, AtlasLower ).
 *
 * For every column j of C and every row i, bottom-up:
 *   - ALPHA * B(i,j) is formed;
 *   - for k > i, A(k,i) times that value is added to C(k,j), while
 *     B(k,j) * A(k,i) is accumulated in a separate sum;
 *   - C(i,j) is passed to Mcelscal with BETA, then receives
 *     ALPHA * B(i,j) times the diagonal entry A(i,i), plus ALPHA times
 *     the accumulated sum.
 * Only the lower triangle of A is referenced.  A, B and C hold
 * interleaved (real, imaginary) float pairs in column-major order.
 *
 * NOTE(review): Mmul, Mset, Mmla and Mcelscal are macros defined
 * outside this view; complex multiply, copy, multiply-accumulate and
 * element scale are assumed.
 */
void ATL_crefsymmLL
(
   const int M, const int N, const float * ALPHA,
   const float * A, const int LDA, const float * B, const int LDB,
   const float * BETA, float * C, const int LDC
)
{
   register float ab_i, ab_r, dot_i, dot_r;
   const int a_step = 2 * LDA, b_step = 2 * LDB, c_step = 2 * LDC;
   int a_col, a_pos, b_col, b_dst, b_pos, c_col, c_dst, c_pos,
       col, p, row;

   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;
      c_col = col * c_step;

      for( row = M - 1; row >= 0; row-- )
      {
         a_col = row * a_step;
         b_dst = b_col + 2 * row;
         c_dst = c_col + 2 * row;

         Mmul( ALPHA[0], ALPHA[1], B[b_dst], B[b_dst+1], ab_r, ab_i );
         Mset( ATL_sZERO, ATL_sZERO, dot_r, dot_i );

         /* Rows below: they were already BETA-scaled in earlier passes. */
         a_pos = a_col + 2 * ( row + 1 );
         b_pos = b_col + 2 * ( row + 1 );
         c_pos = c_col + 2 * ( row + 1 );
         for( p = row + 1; p < M; p++ )
         {
            Mmla( A[a_pos], A[a_pos+1], ab_r, ab_i, C[c_pos], C[c_pos+1] );
            Mmla( B[b_pos], B[b_pos+1], A[a_pos], A[a_pos+1], dot_r, dot_i );
            a_pos += 2;
            b_pos += 2;
            c_pos += 2;
         }

         Mcelscal( BETA[0], BETA[1], C[c_dst], C[c_dst+1] );

         a_pos = a_col + 2 * row;               /* diagonal A(row,row) */
         Mmla( ab_r, ab_i, A[a_pos], A[a_pos+1], C[c_dst], C[c_dst+1] );
         Mmla( ALPHA[0], ALPHA[1], dot_r, dot_i, C[c_dst], C[c_dst+1] );
      }
   }
}
/*
 * ATL_crefher2kUN -- ATL_crefher2k kernel for
 * ( AtlasUpper, AtlasNoTrans ).  BETA is a real scalar.
 *
 * Only rows 0..j of column j of C are touched.  For each column j:
 *   - the 2*j floats above the diagonal are passed to Msvscal with
 *     BETA;
 *   - the real part of C(j,j) is passed to Mselscal with BETA and its
 *     imaginary part is set to ATL_sZERO;
 *   - for each l < K, wb = ALPHA * conj( B(j,l) ) and
 *     wa = conj( ALPHA ) * conj( A(j,l) ) are formed; every C(i,j),
 *     i < j, receives A(i,l)*wb + B(i,l)*wa, and the diagonal receives
 *     the real part of A(j,l)*wb + B(j,l)*wa (imaginary part forced to
 *     ATL_sZERO).
 * A, B and C hold interleaved (real, imaginary) float pairs in
 * column-major order.
 *
 * NOTE(review): Msvscal, Mselscal, Mmul, Mmla and Mset are macros
 * defined outside this view; real vector/scalar scale, complex
 * multiply, multiply-accumulate and copy are assumed.
 */
void ATL_crefher2kUN
(
   const int N, const int K, const float * ALPHA,
   const float * A, const int LDA, const float * B, const int LDB,
   const float BETA, float * C, const int LDC
)
{
   float wa_i, wa_r, wb_i, wb_r;
   const int a_step = 2 * LDA, b_step = 2 * LDB, c_step = 2 * LDC;
   int a_col, a_pos, above, b_col, b_pos, c_col, c_pos, col, p, row;
   float * c_head;

   for( col = 0; col < N; col++ )
   {
      c_col  = col * c_step;
      above  = 2 * col;                          /* floats over the diag */
      c_head = C + c_col;
      Msvscal( above, BETA, c_head, 1 );

      c_pos = c_col + 2 * col;                   /* offset of C(col,col) */
      Mselscal( BETA, C[c_pos] );
      C[c_pos+1] = ATL_sZERO;

      for( p = 0; p < K; p++ )
      {
         a_col = p * a_step;
         b_col = p * b_step;
         a_pos = a_col + 2 * col;                /* offset of A(col,p)   */
         b_pos = b_col + 2 * col;                /* offset of B(col,p)   */

         Mmul( ALPHA[0],  ALPHA[1], B[b_pos], -B[b_pos+1], wb_r, wb_i );
         Mmul( ALPHA[0], -ALPHA[1], A[a_pos], -A[a_pos+1], wa_r, wa_i );

         a_pos = a_col;
         b_pos = b_col;
         c_pos = c_col;
         for( row = 0; row < col; row++ )
         {
            Mmla( A[a_pos], A[a_pos+1], wb_r, wb_i, C[c_pos], C[c_pos+1] );
            Mmla( B[b_pos], B[b_pos+1], wa_r, wa_i, C[c_pos], C[c_pos+1] );
            a_pos += 2;
            b_pos += 2;
            c_pos += 2;
         }

         /* The running offsets now address row col: the diagonal.
          * Real part only, imaginary part forced to zero. */
         Mset( C[c_pos] + A[a_pos] * wb_r - A[a_pos+1] * wb_i + B[b_pos] * wa_r - B[b_pos+1] * wa_i,
               ATL_sZERO, C[c_pos], C[c_pos+1] );
      }
   }
}