Пример #1
0
void ATL_creftrmmLUCN
(
   const int                  M,
   const int                  N,
   const float                * ALPHA,
   const float                * A,
   const int                  LDA,
   float                      * B,
   const int                  LDB
)
{
/*
 * Purpose
 * =======
 *
 * ATL_creftrmmLUCN( ... ) is the specialization
 *
 *    ATL_creftrmm
 *    ( AtlasLeft, AtlasUpper, AtlasConjTrans, AtlasNonUnit, ... )
 *
 * See ATL_creftrmm for the argument description.
 *
 * Notes
 * =====
 *
 * A and B are addressed as arrays of float pairs: entry (r,c) of A is
 * read at A[2*r + 2*LDA*c] and A[2*r + 2*LDA*c + 1], entry (r,c) of B
 * lives at B[2*r + 2*LDB*c] and the following float.
 *
 * Each column of B is processed independently,  rows from M-1 down to
 * 0. For row i the accumulator starts from B(i,j), is combined with the
 * diagonal pair of A (second component negated) through Msscl, then
 * receives one Mmla contribution per k < i built from A(k,i) (second
 * component negated) and the not yet overwritten B(k,j).  The result is
 * combined with ALPHA through Mmul and stored back into B(i,j).
 *
 * Mset, Msscl, Mmla and Mmul are macros defined outside this routine;
 * they are assumed to be the complex copy / scale / multiply-add /
 * multiply their names suggest - confirm against their definitions.
 *
 * All offsets are formed by multiplication inside the loop bodies, so
 * no offset is ever derived from row index -1 when M is zero (the
 * former ((M-1)<<1) left-shifted a negative value, which is undefined
 * behaviour in C).
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   float                      acc_i, acc_r;
   int                        col, row, p, a_col, a_kk, a_off, b_col,
                              b_dst, b_src;
   const int                  a_step = 2 * LDA, b_step = 2 * LDB;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;

      for( row = M - 1; row >= 0; row-- )
      {
         a_col = row * a_step;            /* start of column `row` of A  */
         a_kk  = a_col + 2 * row;         /* diagonal entry A(row,row)   */
         b_dst = b_col + 2 * row;         /* entry B(row,col)            */

         Mset( B[b_dst], B[b_dst+1], acc_r, acc_i );
         Msscl( A[a_kk], -A[a_kk+1], acc_r, acc_i );

         a_off = a_col;
         b_src = b_col;
         for( p = 0; p < row; p++ )
         {
            Mmla( A[a_off], -A[a_off+1], B[b_src], B[b_src+1],
                  acc_r, acc_i );
            a_off += 2;
            b_src += 2;
         }
         Mmul( ALPHA[0], ALPHA[1], acc_r, acc_i, B[b_dst], B[b_dst+1] );
      }
   }
/*
 * End of ATL_creftrmmLUCN
 */
}
Пример #2
0
void ATL_creftrsmLLTU
(
   const int                  M,
   const int                  N,
   const float                * ALPHA,
   const float                * A,
   const int                  LDA,
   float                      * B,
   const int                  LDB
)
{
/*
 * Purpose
 * =======
 *
 * ATL_creftrsmLLTU( ... ) is the specialization
 *
 *    ATL_creftrsm
 *    ( AtlasLeft, AtlasLower, AtlasTrans, AtlasUnit, ... )
 *
 * See ATL_creftrsm for the argument description.
 *
 * Notes
 * =====
 *
 * A and B are addressed as arrays of float pairs: entry (r,c) of A is
 * read at A[2*r + 2*LDA*c], entry (r,c) of B at B[2*r + 2*LDB*c].
 *
 * Each column of B is processed independently,  rows from M-1 down to
 * 0.  For row i the temporary is produced by Mmul from ALPHA and
 * B(i,j); every k > i then contributes A(k,i) and the already updated
 * B(k,j) through Mmls, and the temporary is stored back into B(i,j).
 * The diagonal of A is never read.
 *
 * Mmul, Mmls and Mset are macros defined outside this routine; they are
 * assumed to be the complex multiply / multiply-subtract / copy their
 * names suggest - confirm against their definitions.
 *
 * Offsets are formed by multiplication inside the loop bodies, so no
 * negative value is ever left-shifted when M is zero (the former
 * ((M-1) << 1) was undefined behaviour in that case).
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register float             rhs_i, rhs_r;
   int                        col, row, p, a_off, b_col, b_dst, b_src;
   const int                  a_step = 2 * LDA, b_step = 2 * LDB;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;

      for( row = M - 1; row >= 0; row-- )
      {
         b_dst = b_col + 2 * row;         /* entry B(row,col)            */
         Mmul( ALPHA[0], ALPHA[1], B[b_dst], B[b_dst+1], rhs_r, rhs_i );

         a_off = row * a_step + 2 * ( row + 1 );   /* A(row+1,row)       */
         b_src = b_dst + 2;                        /* B(row+1,col)       */
         for( p = row + 1; p < M; p++ )
         {
            Mmls( A[a_off], A[a_off+1], B[b_src], B[b_src+1],
                  rhs_r, rhs_i );
            a_off += 2;
            b_src += 2;
         }
         Mset( rhs_r, rhs_i, B[b_dst], B[b_dst+1] );
      }
   }
/*
 * End of ATL_creftrsmLLTU
 */
}
Пример #3
0
void ATL_zreftrmmLLNU
(
   const int                  M,
   const int                  N,
   const double               * ALPHA,
   const double               * A,
   const int                  LDA,
   double                     * B,
   const int                  LDB
)
{
/*
 * Purpose
 * =======
 *
 * ATL_zreftrmmLLNU( ... ) is the specialization
 *
 *    ATL_zreftrmm
 *    ( AtlasLeft, AtlasLower, AtlasNoTrans, AtlasUnit, ... )
 *
 * See ATL_zreftrmm for the argument description.
 *
 * Notes
 * =====
 *
 * A and B are addressed as arrays of double pairs: entry (r,c) of A is
 * read at A[2*r + 2*LDA*c], entry (r,c) of B at B[2*r + 2*LDB*c].
 *
 * Each column of B is processed independently,  pivot rows k from M-1
 * down to 0.  B(k,j) is replaced by the Mmul of ALPHA and B(k,j); that
 * same value is then combined with A(i,k) and added through Mmla into
 * every B(i,j) with i > k.  The diagonal of A is never read.
 *
 * Mmul, Mset and Mmla are macros defined outside this routine; they are
 * assumed to be the complex multiply / copy / multiply-add their names
 * suggest - confirm against their definitions.
 *
 * Offsets are formed by multiplication inside the loop bodies, so no
 * negative value is ever left-shifted when M is zero (the former
 * ((M-1)<<1) was undefined behaviour in that case).
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   double                     s_i, s_r;
   int                        col, piv, row, a_off, b_col, b_piv, b_dst;
   const int                  a_step = 2 * LDA, b_step = 2 * LDB;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;

      for( piv = M - 1; piv >= 0; piv-- )
      {
         b_piv = b_col + 2 * piv;         /* entry B(piv,col)            */
         Mmul( ALPHA[0], ALPHA[1], B[b_piv], B[b_piv+1], s_r, s_i );
         Mset( s_r, s_i, B[b_piv], B[b_piv+1] );

         a_off = piv * a_step + 2 * ( piv + 1 );   /* A(piv+1,piv)       */
         b_dst = b_piv + 2;                        /* B(piv+1,col)       */
         for( row = piv + 1; row < M; row++ )
         {
            Mmla( s_r, s_i, A[a_off], A[a_off+1], B[b_dst], B[b_dst+1] );
            a_off += 2;
            b_dst += 2;
         }
      }
   }
/*
 * End of ATL_zreftrmmLLNU
 */
}
Пример #4
0
void ATL_crefgpmvLC
(
   const int                  M,
   const int                  N,
   const float                * ALPHA,
   const float                * A,
   const int                  LDA,
   const float                * X,
   const int                  INCX,
   const float                * BETA,
   float                      * Y,
   const int                  INCY
)
{
/*
 * Purpose
 * =======
 *
 * ATL_crefgpmvLC( ... ) is the specialization
 *
 *    ATL_crefgpmv( AtlasLower, AtlasConj, ... )
 *
 * See ATL_crefgpmv for the argument description.
 *
 * Notes
 * =====
 *
 * Y is first handed to Mcvscal together with M, BETA and INCY.  Then,
 * for each of the N columns, a temporary is formed by Mmul from ALPHA
 * and the current pair of X,  and M consecutive pairs of A (second
 * component negated) are combined with it and added into Y by Mmla.
 *
 * The distance between two consecutive column starts of A is not
 * constant: it begins at 2*LDA floats and is reduced by 2 *before*
 * each advance, so the first advance is 2*LDA - 2.
 *
 * Mcvscal, Mmul and Mmla are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register float             ax_i, ax_r;
   int                        col, row, a_col = 0, a_off, x_off = 0, y_off,
                              a_step = 2 * LDA;
   const int                  x_step = 2 * INCX, y_step = 2 * INCY;
/* ..
 * .. Executable Statements ..
 *
 */
   Mcvscal( M, BETA, Y, INCY );

   for( col = 0; col < N; col++ )
   {
      Mmul( ALPHA[0], ALPHA[1], X[x_off], X[x_off+1], ax_r, ax_i );

      a_off = a_col;
      y_off = 0;
      for( row = 0; row < M; row++ )
      {
         Mmla( A[a_off], -A[a_off+1], ax_r, ax_i, Y[y_off], Y[y_off+1] );
         a_off += 2;
         y_off += y_step;
      }
/*
 *    Shrink the column stride first, then move to the next column.
 */
      a_step -= 2;
      a_col  += a_step;
      x_off  += x_step;
   }
/*
 * End of ATL_crefgpmvLC
 */
}
Пример #5
0
void ATL_crefsyrkLN
(
   const int                  N,
   const int                  K,
   const float                * ALPHA,
   const float                * A,
   const int                  LDA,
   const float                * BETA,
   float                      * C,
   const int                  LDC
)
{
/*
 * Purpose
 * =======
 *
 * ATL_crefsyrkLN( ... ) is the specialization
 *
 *    ATL_crefsyrk( AtlasLower, AtlasNoTrans, ... )
 *
 * See ATL_crefsyrk for the argument description.
 *
 * Notes
 * =====
 *
 * A and C are addressed as arrays of float pairs: entry (r,c) of A is
 * read at A[2*r + 2*LDA*c], entry (r,c) of C at C[2*r + 2*LDC*c].
 *
 * For column j of C only rows j..N-1 are touched.  That part of the
 * column is first passed to Mcvscal with BETA; then for each l < K a
 * temporary is formed by Mmul from ALPHA and A(j,l), and A(i,l) is
 * combined with it and added into C(i,j) by Mmla for i = j..N-1.
 *
 * Mcvscal, Mmul and Mmla are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register float             w_i, w_r;
   int                        col, row, p, a_jp, a_off, c_jj, c_off;
   const int                  a_step = 2 * LDA, c_step = 2 * LDC;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      c_jj = col * c_step + 2 * col;      /* diagonal entry C(col,col)   */
      Mcvscal( N - col, BETA, C + c_jj, 1 );

      for( p = 0; p < K; p++ )
      {
         a_jp = p * a_step + 2 * col;     /* entry A(col,p)              */
         Mmul( ALPHA[0], ALPHA[1], A[a_jp], A[a_jp+1], w_r, w_i );

         a_off = a_jp;
         c_off = c_jj;
         for( row = col; row < N; row++ )
         {
            Mmla( w_r, w_i, A[a_off], A[a_off+1], C[c_off], C[c_off+1] );
            a_off += 2;
            c_off += 2;
         }
      }
   }
/*
 * End of ATL_crefsyrkLN
 */
}
Пример #6
0
void ATL_creftrsmLUTN
(
   const int                  M,
   const int                  N,
   const float                * ALPHA,
   const float                * A,
   const int                  LDA,
   float                      * B,
   const int                  LDB
)
{
/*
 * Purpose
 * =======
 *
 * ATL_creftrsmLUTN( ... ) is the specialization
 *
 *    ATL_creftrsm
 *    ( AtlasLeft, AtlasUpper, AtlasTrans, AtlasNonUnit, ... )
 *
 * See ATL_creftrsm for the argument description.
 *
 * Notes
 * =====
 *
 * A and B are addressed as arrays of float pairs: entry (r,c) of A is
 * read at A[2*r + 2*LDA*c], entry (r,c) of B at B[2*r + 2*LDB*c].
 *
 * Each column of B is processed independently,  rows from 0 up to M-1.
 * For row i the temporary is produced by Mmul from ALPHA and B(i,j);
 * every k < i contributes A(k,i) and the already updated B(k,j) through
 * Mmls; the temporary is then passed to Msdiv with the diagonal pair
 * A(i,i) and finally stored back into B(i,j).
 *
 * Mmul, Mmls, Msdiv and Mset are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register float             rhs_i, rhs_r;
   int                        col, row, p, a_col, a_kk, a_off, b_col,
                              b_dst, b_src;
   const int                  a_step = 2 * LDA, b_step = 2 * LDB;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;

      for( row = 0; row < M; row++ )
      {
         a_col = row * a_step;            /* start of column `row` of A  */
         b_dst = b_col + 2 * row;         /* entry B(row,col)            */
         Mmul( ALPHA[0], ALPHA[1], B[b_dst], B[b_dst+1], rhs_r, rhs_i );

         a_off = a_col;
         b_src = b_col;
         for( p = 0; p < row; p++ )
         {
            Mmls( A[a_off], A[a_off+1], B[b_src], B[b_src+1],
                  rhs_r, rhs_i );
            a_off += 2;
            b_src += 2;
         }

         a_kk = a_col + 2 * row;          /* diagonal entry A(row,row)   */
         Msdiv( A[a_kk], A[a_kk+1], rhs_r, rhs_i );
         Mset( rhs_r, rhs_i, B[b_dst], B[b_dst+1] );
      }
   }
/*
 * End of ATL_creftrsmLUTN
 */
}
Пример #7
0
void ATL_zreftrmmLLCU
(
   const int                  M,
   const int                  N,
   const double               * ALPHA,
   const double               * A,
   const int                  LDA,
   double                     * B,
   const int                  LDB
)
{
/*
 * Purpose
 * =======
 *
 * ATL_zreftrmmLLCU( ... ) is the specialization
 *
 *    ATL_zreftrmm
 *    ( AtlasLeft, AtlasLower, AtlasConjTrans, AtlasUnit, ... )
 *
 * See ATL_zreftrmm for the argument description.
 *
 * Notes
 * =====
 *
 * A and B are addressed as arrays of double pairs: entry (r,c) of A is
 * read at A[2*r + 2*LDA*c], entry (r,c) of B at B[2*r + 2*LDB*c].
 *
 * Each column of B is processed independently,  rows from 0 up to M-1.
 * For row i the accumulator starts from B(i,j) and receives one Mmla
 * contribution per k > i built from A(k,i) (second component negated)
 * and the not yet overwritten B(k,j).  The result is combined with
 * ALPHA through Mmul and stored into B(i,j).  The diagonal of A is
 * never read.
 *
 * Mset, Mmla and Mmul are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   double                     acc_i, acc_r;
   int                        col, row, p, a_off, b_col, b_dst, b_src;
   const int                  a_step = 2 * LDA, b_step = 2 * LDB;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;

      for( row = 0; row < M; row++ )
      {
         b_dst = b_col + 2 * row;         /* entry B(row,col)            */
         Mset( B[b_dst], B[b_dst+1], acc_r, acc_i );

         a_off = row * a_step + 2 * ( row + 1 );   /* A(row+1,row)       */
         b_src = b_dst + 2;                        /* B(row+1,col)       */
         for( p = row + 1; p < M; p++ )
         {
            Mmla( A[a_off], -A[a_off+1], B[b_src], B[b_src+1],
                  acc_r, acc_i );
            a_off += 2;
            b_src += 2;
         }
         Mmul( ALPHA[0], ALPHA[1], acc_r, acc_i, B[b_dst], B[b_dst+1] );
      }
   }
/*
 * End of ATL_zreftrmmLLCU
 */
}
Пример #8
0
void ATL_zrefsyrkUN
(
   const int                  N,
   const int                  K,
   const double               * ALPHA,
   const double               * A,
   const int                  LDA,
   const double               * BETA,
   double                     * C,
   const int                  LDC
)
{
/*
 * Purpose
 * =======
 *
 * ATL_zrefsyrkUN( ... ) is the specialization
 *
 *    ATL_zrefsyrk( AtlasUpper, AtlasNoTrans, ... )
 *
 * See ATL_zrefsyrk for the argument description.
 *
 * Notes
 * =====
 *
 * A and C are addressed as arrays of double pairs: entry (r,c) of A is
 * read at A[2*r + 2*LDA*c], entry (r,c) of C at C[2*r + 2*LDC*c].
 *
 * For column j of C only rows 0..j are touched.  That part of the
 * column is first passed to Mzvscal with BETA; then for each l < K a
 * temporary is formed by Mmul from ALPHA and A(j,l), and A(i,l) is
 * combined with it and added into C(i,j) by Mmla for i = 0..j.
 *
 * Mzvscal, Mmul and Mmla are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register double            w_i, w_r;
   int                        col, row, p, a_jp, a_off, a_pcol, c_col,
                              c_off;
   const int                  a_step = 2 * LDA, c_step = 2 * LDC;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      c_col = col * c_step;               /* start of column `col` of C  */
      Mzvscal( col + 1, BETA, C + c_col, 1 );

      for( p = 0; p < K; p++ )
      {
         a_pcol = p * a_step;             /* start of column `p` of A    */
         a_jp   = a_pcol + 2 * col;       /* entry A(col,p)              */
         Mmul( ALPHA[0], ALPHA[1], A[a_jp], A[a_jp+1], w_r, w_i );

         a_off = a_pcol;
         c_off = c_col;
         for( row = 0; row <= col; row++ )
         {
            Mmla( w_r, w_i, A[a_off], A[a_off+1], C[c_off], C[c_off+1] );
            a_off += 2;
            c_off += 2;
         }
      }
   }
/*
 * End of ATL_zrefsyrkUN
 */
}
Пример #9
0
void ATL_creftbmvUNN
(
   const int                  N,
   const int                  K,
   const float                * A,
   const int                  LDA,
   float                      * X,
   const int                  INCX
)
{
/*
 * Purpose
 * =======
 *
 * ATL_creftbmvUNN( ... ) is the specialization
 *
 *    ATL_creftbmv( AtlasUpper, AtlasNoTrans, AtlasNonUnit, ... )
 *
 * See ATL_creftbmv for the argument description.
 *
 * Notes
 * =====
 *
 * Columns are visited from 0 to N-1; consecutive columns of A start
 * 2*LDA floats apart.  For column j the current pair of X is copied to
 * a temporary; rows max( 0, j-K )..j-1 each combine a pair of A with
 * that temporary and add the result into the matching pair of X (Mmla);
 * finally X(j) is overwritten with the Mmul of the next pair of A (the
 * one following the last row visited) and the temporary.
 *
 * Within column j the first pair read sits at float offset
 * 2*( K - j + max( 0, j-K ) ) from the start of the column.  The X
 * offset of the first row only starts advancing once j >= K.
 *
 * Mset, Mmla and Mmul are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register float             xj_i, xj_r;
   int                        col, row, first, a_col = 0, a_off,
                              x_base = 0, x_col = 0, x_off;
   const int                  a_step = 2 * LDA, x_step = 2 * INCX;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      Mset( X[x_col], X[x_col+1], xj_r, xj_i );

      first = col - K;
      if( first < 0 ) { first = 0; }

      a_off = a_col + 2 * ( K - col + first );
      x_off = x_base;
      for( row = first; row < col; row++ )
      {
         Mmla( A[a_off], A[a_off+1], xj_r, xj_i, X[x_off], X[x_off+1] );
         a_off += 2;
         x_off += x_step;
      }
/*
 *    a_off now designates the pair following the last one used above.
 */
      Mmul( A[a_off], A[a_off+1], xj_r, xj_i, X[x_col], X[x_col+1] );

      if( col >= K ) { x_base += x_step; }
      a_col += a_step;
      x_col += x_step;
   }
/*
 * End of ATL_creftbmvUNN
 */
}
Пример #10
0
void ATL_creftbmvLTN
(
   const int                  N,
   const int                  K,
   const float                * A,
   const int                  LDA,
   float                      * X,
   const int                  INCX
)
{
/*
 * Purpose
 * =======
 *
 * ATL_creftbmvLTN( ... ) is the specialization
 *
 *    ATL_creftbmv( AtlasLower, AtlasTrans, AtlasNonUnit, ... )
 *
 * See ATL_creftbmv for the argument description.
 *
 * Notes
 * =====
 *
 * Columns are visited from 0 to N-1; consecutive columns of A start
 * 2*LDA floats apart.  For column j a temporary is formed by Mmul from
 * the first pair of the column and X(j); rows j+1..min( N-1, j+K ) then
 * each add, through Mmla, the next pair of A combined with the matching
 * (not yet overwritten) pair of X.  The temporary is finally stored
 * into X(j).
 *
 * Mmul, Mmla and Mset are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register float             acc_i, acc_r;
   int                        col, row, last, a_col = 0, a_off, x_col = 0,
                              x_off;
   const int                  a_step = 2 * LDA, x_step = 2 * INCX;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      Mmul( A[a_col], A[a_col+1], X[x_col], X[x_col+1], acc_r, acc_i );

      last = col + K;
      if( last > N - 1 ) { last = N - 1; }

      a_off = a_col + 2;
      x_off = x_col + x_step;
      for( row = col + 1; row <= last; row++ )
      {
         Mmla( A[a_off], A[a_off+1], X[x_off], X[x_off+1], acc_r, acc_i );
         a_off += 2;
         x_off += x_step;
      }
      Mset( acc_r, acc_i, X[x_col], X[x_col+1] );

      a_col += a_step;
      x_col += x_step;
   }
/*
 * End of ATL_creftbmvLTN
 */
}
Пример #11
0
void ATL_zrefgemvN
(
   const int                  M,
   const int                  N,
   const double               * ALPHA,
   const double               * A,
   const int                  LDA,
   const double               * X,
   const int                  INCX,
   const double               * BETA,
   double                     * Y,
   const int                  INCY
)
{
/*
 * Purpose
 * =======
 *
 * ATL_zrefgemvN( ... ) <=> ATL_zrefgemv( AtlasNoTrans, ... )
 *
 * See ATL_zrefgemv for the argument description.
 *
 * Notes
 * =====
 *
 * Y is first handed to Mzvscal together with M, BETA and INCY.  Then,
 * for each of the N columns of A (2*LDA doubles apart), a temporary is
 * formed by Mmul from ALPHA and the current pair of X, and the M pairs
 * of the column are combined with it and added into Y by Mmla.
 *
 * Mzvscal, Mmul and Mmla are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register double            ax_i, ax_r;
   int                        col, row, a_col = 0, a_off, x_off = 0, y_off;
   const int                  a_step = 2 * LDA, x_step = 2 * INCX,
                              y_step = 2 * INCY;
/* ..
 * .. Executable Statements ..
 *
 */
   Mzvscal( M, BETA, Y, INCY );

   for( col = 0; col < N; col++ )
   {
      Mmul( ALPHA[0], ALPHA[1], X[x_off], X[x_off+1], ax_r, ax_i );

      a_off = a_col;
      y_off = 0;
      for( row = 0; row < M; row++ )
      {
         Mmla( A[a_off], A[a_off+1], ax_r, ax_i, Y[y_off], Y[y_off+1] );
         a_off += 2;
         y_off += y_step;
      }
      a_col += a_step;
      x_off += x_step;
   }
/*
 * End of ATL_zrefgemvN
 */
}
Пример #12
0
void ATL_creftrmvLHN
(
   const int                  N,
   const float                * A,
   const int                  LDA,
   float                      * X,
   const int                  INCX
)
{
/*
 * Purpose
 * =======
 *
 * ATL_creftrmvLHN( ... ) is the specialization
 *
 *    ATL_creftrmv( AtlasLower, AtlasConjTrans, AtlasNonUnit, ... )
 *
 * See ATL_creftrmv for the argument description.
 *
 * Notes
 * =====
 *
 * The walk follows the diagonal of A: going from column j to column
 * j+1 advances the A offset by 2*( LDA + 1 ) floats.  For column j a
 * temporary is formed by Mmul from the diagonal pair (second component
 * negated) and X(j); rows j+1..N-1 then each add, through Mmla, the
 * next pair of the column (second component negated) combined with the
 * matching, not yet overwritten, pair of X.  The temporary is finally
 * stored into X(j).
 *
 * Mmul, Mmla and Mset are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register float             acc_i, acc_r;
   int                        col, row, a_diag = 0, a_off, x_col = 0, x_off;
   const int                  diag_step = 2 * ( LDA + 1 ),
                              x_step = 2 * INCX;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      Mmul( A[a_diag], -A[a_diag+1], X[x_col], X[x_col+1], acc_r, acc_i );

      a_off = a_diag + 2;
      x_off = x_col + x_step;
      for( row = col + 1; row < N; row++ )
      {
         Mmla( A[a_off], -A[a_off+1], X[x_off], X[x_off+1], acc_r, acc_i );
         a_off += 2;
         x_off += x_step;
      }
      Mset( acc_r, acc_i, X[x_col], X[x_col+1] );

      a_diag += diag_step;
      x_col  += x_step;
   }
/*
 * End of ATL_creftrmvLHN
 */
}
Пример #13
0
void ATL_zreftpmvUCN
(
   const int                  N,
   const double               * A,
   const int                  LDA,
   double                     * X,
   const int                  INCX
)
{
/*
 * Purpose
 * =======
 *
 * ATL_zreftpmvUCN( ... ) is the specialization
 *
 *    ATL_zreftpmv( AtlasUpper, AtlasConj, AtlasNonUnit, ... )
 *
 * See ATL_zreftpmv for the argument description.
 *
 * Notes
 * =====
 *
 * Columns are visited from 0 to N-1.  For column j the current pair of
 * X is copied to a temporary; rows 0..j-1 each combine a pair of A
 * (second component negated) with that temporary and add the result
 * into the matching pair of X (Mmla); X(j) is then overwritten with the
 * Mmul of the next pair of A (second component negated) and the
 * temporary.
 *
 * The distance between two consecutive column starts of A is not
 * constant: it is 2*LDA doubles for the first advance and grows by 2
 * *after* each advance.
 *
 * Mset, Mmla and Mmul are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register double            xj_i, xj_r;
   int                        col, row, a_col = 0, a_off, x_col = 0, x_off,
                              a_step = 2 * LDA;
   const int                  x_step = 2 * INCX;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      Mset( X[x_col], X[x_col+1], xj_r, xj_i );

      a_off = a_col;
      x_off = 0;
      for( row = 0; row < col; row++ )
      {
         Mmla( A[a_off], -A[a_off+1], xj_r, xj_i, X[x_off], X[x_off+1] );
         a_off += 2;
         x_off += x_step;
      }
/*
 *    a_off now designates the pair following the last one used above.
 */
      Mmul( A[a_off], -A[a_off+1], xj_r, xj_i, X[x_col], X[x_col+1] );

/*
 *    Move to the next column first, then enlarge the column stride.
 */
      a_col  += a_step;
      a_step += 2;
      x_col  += x_step;
   }
/*
 * End of ATL_zreftpmvUCN
 */
}
Пример #14
0
void ATL_zrefgemmNN
(
    const int                  M,
    const int                  N,
    const int                  K,
    const double               * ALPHA,
    const double               * A,
    const int                  LDA,
    const double               * B,
    const int                  LDB,
    const double               * BETA,
    double                     * C,
    const int                  LDC
)
{
    /*
     * Notes
     * =====
     *
     * A, B and C are addressed as arrays of double pairs: entry (r,c)
     * of A is read at A[2*r + 2*LDA*c], of B at B[2*r + 2*LDB*c], and
     * of C at C[2*r + 2*LDC*c].
     *
     * For each column j of C the column is first handed to Mzgescal
     * (as an M by 1 block, with BETA and LDC).  Then, for each l < K,
     * a temporary is formed by Mmul from ALPHA and B(l,j), and the M
     * pairs of column l of A are combined with it and added into
     * column j of C by Mmla.
     *
     * Mzgescal, Mmul and Mmla are macros defined outside this routine.
     */
    /*
     * .. Local Variables ..
     */
    register double            w_i, w_r;
    int                        col, row, p, a_off, b_lj, c_col, c_off;
    const int                  a_step = 2 * LDA, b_step = 2 * LDB,
                               c_step = 2 * LDC;
    /* ..
     * .. Executable Statements ..
     *
     */
    for( col = 0; col < N; col++ )
    {
        c_col = col * c_step;             /* start of column `col` of C */
        Mzgescal( M, 1, BETA, C+c_col, LDC );

        for( p = 0; p < K; p++ )
        {
            b_lj = col * b_step + 2 * p;  /* entry B(p,col)             */
            Mmul( ALPHA[0], ALPHA[1], B[b_lj], B[b_lj+1], w_r, w_i );

            a_off = p * a_step;           /* start of column `p` of A   */
            c_off = c_col;
            for( row = 0; row < M; row++ )
            {
                Mmla( A[a_off], A[a_off+1], w_r, w_i, C[c_off], C[c_off+1] );
                a_off += 2;
                c_off += 2;
            }
        }
    }
    /*
     * End of ATL_zrefgemmNN
     */
}
Пример #15
0
void ATL_zrefhbmvU
(
   const int                  N,
   const int                  K,
   const double               * ALPHA,
   const double               * A,
   const int                  LDA,
   const double               * X,
   const int                  INCX,
   const double               * BETA,
   double                     * Y,
   const int                  INCY
)
{
/*
 * Purpose
 * =======
 *
 * ATL_zrefhbmvU( ... ) is the specialization
 *
 *    ATL_zrefhbmv( AtlasUpper, ... )
 *
 * See ATL_zrefhbmv for the argument description.
 *
 * Notes
 * =====
 *
 * Y is first handed to Mzvscal together with N, BETA and INCY.
 * Columns are then visited from 0 to N-1 (2*LDA doubles apart).  For
 * column j, two temporaries are used: the first is the Mmul of ALPHA
 * and X(j), the second starts at zero.  Rows max( 0, j-K )..j-1 each
 * use one pair of A twice: as is, combined with the first temporary
 * and added into Y(i); and with its second component negated, combined
 * with X(i) and added into the second temporary.  Only the first
 * component of the following pair of A is then used to update Y(j),
 * after which ALPHA combined with the second temporary is added to
 * Y(j).
 *
 * Within column j the first pair read sits at double offset
 * 2*( K - j + max( 0, j-K ) ) from the start of the column.  The X and
 * Y offsets of the first row only start advancing once j >= K.
 *
 * Mzvscal, Mmul, Mset and Mmla are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register double            ax_i, ax_r, dot_i, dot_r;
   int                        col, row, first, a_col = 0, a_off,
                              x_base = 0, x_col = 0, x_off,
                              y_base = 0, y_col = 0, y_off;
   const int                  a_step = 2 * LDA, x_step = 2 * INCX,
                              y_step = 2 * INCY;
/* ..
 * .. Executable Statements ..
 *
 */
   Mzvscal( N, BETA, Y, INCY );

   for( col = 0; col < N; col++ )
   {
      Mmul( ALPHA[0], ALPHA[1], X[x_col], X[x_col+1], ax_r, ax_i );
      Mset( ATL_dZERO, ATL_dZERO, dot_r, dot_i );

      first = col - K;
      if( first < 0 ) { first = 0; }

      a_off = a_col + 2 * ( K - col + first );
      x_off = x_base;
      y_off = y_base;
      for( row = first; row < col; row++ )
      {
         Mmla( A[a_off], A[a_off+1], ax_r, ax_i, Y[y_off], Y[y_off+1] );
         Mmla( A[a_off], -A[a_off+1], X[x_off], X[x_off+1], dot_r, dot_i );
         a_off += 2;
         x_off += x_step;
         y_off += y_step;
      }
/*
 *    a_off now designates the pair following the last one used above;
 *    only its first component enters the update of Y(col).
 */
      Mset( Y[y_col] + A[a_off]*ax_r, Y[y_col+1] + A[a_off]*ax_i,
            Y[y_col], Y[y_col+1] );
      Mmla( ALPHA[0], ALPHA[1], dot_r, dot_i, Y[y_col], Y[y_col+1] );

      if( col >= K )
      {
         x_base += x_step;
         y_base += y_step;
      }
      a_col += a_step;
      x_col += x_step;
      y_col += y_step;
   }
/*
 * End of ATL_zrefhbmvU
 */
}
Пример #16
0
void ATL_zrefher2kLN
(
   const int                  N,
   const int                  K,
   const double               * ALPHA,
   const double               * A,
   const int                  LDA,
   const double               * B,
   const int                  LDB,
   const double               BETA,
   double                     * C,
   const int                  LDC
)
{
/*
 * Purpose
 * =======
 *
 * ATL_zrefher2kLN( ... ) is the specialization
 *
 *    ATL_zrefher2k( AtlasLower, AtlasNoTrans, ... )
 *
 * See ATL_zrefher2k for the argument description.
 *
 * Notes
 * =====
 *
 * A, B and C are addressed as arrays of double pairs: entry (r,c) of A
 * is read at A[2*r + 2*LDA*c], of B at B[2*r + 2*LDB*c], and of C at
 * C[2*r + 2*LDC*c].  BETA is a plain double, not a pair.
 *
 * For column j of C only rows j..N-1 are touched.  The first component
 * of the diagonal entry is passed to Mdelscal with BETA and its second
 * component is set to zero; the 2*(N-j-1) doubles below the diagonal
 * are passed to Mdvscal with BETA.
 *
 * For each l < K two temporaries are formed by Mmul: one from ALPHA
 * and B(j,l) with negated second component, one from ALPHA with negated
 * second component and A(j,l) with negated second component.  The
 * diagonal entry receives only the first component of the combined
 * update and has its second component reset to zero; every row below
 * receives two Mmla updates, A(i,l) with the first temporary and
 * B(i,l) with the second.
 *
 * Mdelscal, Mdvscal, Mmul, Mset and Mmla are macros defined outside
 * this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   double                     u_i, u_r, v_i, v_r;
   int                        col, row, p, a_jl, a_off, b_jl, b_off,
                              c_jj, c_off;
   const int                  a_step = 2 * LDA, b_step = 2 * LDB,
                              c_step = 2 * LDC;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      c_jj = col * c_step + 2 * col;      /* diagonal entry C(col,col)   */

      Mdelscal( BETA, C[c_jj] );
      C[c_jj+1] = ATL_dZERO;
      Mdvscal( 2 * ( N - col - 1 ), BETA, C + c_jj + 2, 1 );

      for( p = 0; p < K; p++ )
      {
         a_jl = p * a_step + 2 * col;     /* entry A(col,p)              */
         b_jl = p * b_step + 2 * col;     /* entry B(col,p)              */

         Mmul( ALPHA[0],  ALPHA[1], B[b_jl], -B[b_jl+1], u_r, u_i );
         Mmul( ALPHA[0], -ALPHA[1], A[a_jl], -A[a_jl+1], v_r, v_i );
/*
 *       Diagonal entry: first component updated, second forced to zero.
 */
         Mset( C[c_jj] + A[a_jl] * u_r - A[a_jl+1] * u_i +
                         B[b_jl] * v_r - B[b_jl+1] * v_i,
               ATL_dZERO, C[c_jj], C[c_jj+1] );
/*
 *       Rows strictly below the diagonal.
 */
         a_off = a_jl + 2;
         b_off = b_jl + 2;
         c_off = c_jj + 2;
         for( row = col + 1; row < N; row++ )
         {
            Mmla( A[a_off], A[a_off+1], u_r, u_i, C[c_off], C[c_off+1] );
            Mmla( B[b_off], B[b_off+1], v_r, v_i, C[c_off], C[c_off+1] );
            a_off += 2;
            b_off += 2;
            c_off += 2;
         }
      }
   }
/*
 * End of ATL_zrefher2kLN
 */
}
Пример #17
0
void ATL_crefhemmRL
(
   const int                  M,
   const int                  N,
   const float                * ALPHA,
   const float                * A,
   const int                  LDA,
   const float                * B,
   const int                  LDB,
   const float                * BETA,
   float                      * C,
   const int                  LDC
)
{
/*
 * Purpose
 * =======
 *
 * ATL_crefhemmRL( ... ) is the specialization
 *
 *    ATL_crefhemm( AtlasRight, AtlasLower, ... )
 *
 * See ATL_crefhemm for the argument description.
 *
 * Notes
 * =====
 *
 * A, B and C are addressed as arrays of float pairs: entry (r,c) of A
 * is read at A[2*r + 2*LDA*c], of B at B[2*r + 2*LDB*c], and of C at
 * C[2*r + 2*LDC*c].  Only entries (r,c) of A with r >= c are read.
 *
 * Column j of C is built in three passes over the columns of B:
 *
 *   1. column j itself:  every C(i,j) is passed to Mcelscal with BETA,
 *      then B(i,j) is added in with a factor made of ALPHA times the
 *      first component only of A(j,j);
 *   2. columns k < j:  the factor is the Mmul of ALPHA and A(j,k) with
 *      negated second component;
 *   3. columns k > j:  the factor is the Mmul of ALPHA and A(k,j).
 *
 * Mset, Mcelscal, Mmla and Mmul are macros defined outside this
 * routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register float             f_i, f_r;
   int                        col, row, p, a_col, a_jj, a_off, b_off,
                              c_col, c_off;
   const int                  a_step = 2 * LDA, b_step = 2 * LDB,
                              c_step = 2 * LDC;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      a_col = col * a_step;               /* start of column `col` of A  */
      c_col = col * c_step;               /* start of column `col` of C  */
/*
 *    Pass 1: scale column `col` of C and add the diagonal contribution.
 */
      a_jj = a_col + 2 * col;
      Mset( ALPHA[0] * A[a_jj], ALPHA[1] * A[a_jj], f_r, f_i );

      b_off = col * b_step;
      c_off = c_col;
      for( row = 0; row < M; row++ )
      {
         Mcelscal( BETA[0], BETA[1], C[c_off], C[c_off+1] );
         Mmla( f_r, f_i, B[b_off], B[b_off+1], C[c_off], C[c_off+1] );
         b_off += 2;
         c_off += 2;
      }
/*
 *    Pass 2: columns p < col, reading A(col,p) along row `col`.
 */
      a_off = 2 * col;
      for( p = 0; p < col; p++ )
      {
         Mmul( ALPHA[0], ALPHA[1], A[a_off], -A[a_off+1], f_r, f_i );

         b_off = p * b_step;
         c_off = c_col;
         for( row = 0; row < M; row++ )
         {
            Mmla( f_r, f_i, B[b_off], B[b_off+1], C[c_off], C[c_off+1] );
            b_off += 2;
            c_off += 2;
         }
         a_off += a_step;
      }
/*
 *    Pass 3: columns p > col, reading A(p,col) down column `col`.
 */
      a_off = a_col + 2 * ( col + 1 );
      for( p = col + 1; p < N; p++ )
      {
         Mmul( ALPHA[0], ALPHA[1], A[a_off], A[a_off+1], f_r, f_i );

         b_off = p * b_step;
         c_off = c_col;
         for( row = 0; row < M; row++ )
         {
            Mmla( f_r, f_i, B[b_off], B[b_off+1], C[c_off], C[c_off+1] );
            b_off += 2;
            c_off += 2;
         }
         a_off += 2;
      }
   }
/*
 * End of ATL_crefhemmRL
 */
}
Пример #18
0
void ATL_crefhpmvU
(
   const int                  N,
   const float                * ALPHA,
   const float                * A,
   const int                  LDA,
   const float                * X,
   const int                  INCX,
   const float                * BETA,
   float                      * Y,
   const int                  INCY
)
{
/*
 * Purpose
 * =======
 *
 * ATL_crefhpmvU( ... ) is the specialization
 *
 *    ATL_crefhpmv( AtlasUpper, ... )
 *
 * See ATL_crefhpmv for the argument description.
 *
 * Notes
 * =====
 *
 * Y is first handed to Mcvscal together with N, BETA and INCY.
 * Columns are then visited from 0 to N-1.  For column j, two
 * temporaries are used: the first is the Mmul of ALPHA and X(j), the
 * second starts at zero.  Rows 0..j-1 each use one pair of A twice: as
 * is, combined with the first temporary and added into Y(i); and with
 * its second component negated, combined with X(i) and added into the
 * second temporary.  Only the first component of the following pair of
 * A is then used to update Y(j), after which ALPHA combined with the
 * second temporary is added to Y(j).
 *
 * The distance between two consecutive column starts of A is not
 * constant: it is 2*LDA floats for the first advance and grows by 2
 * *after* each advance.
 *
 * Mcvscal, Mmul, Mset and Mmla are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register float             ax_i, ax_r, dot_i, dot_r;
   int                        col, row, a_col = 0, a_off, x_col = 0, x_off,
                              y_col = 0, y_off, a_step = 2 * LDA;
   const int                  x_step = 2 * INCX, y_step = 2 * INCY;
/* ..
 * .. Executable Statements ..
 *
 */
   Mcvscal( N, BETA, Y, INCY );

   for( col = 0; col < N; col++ )
   {
      Mmul( ALPHA[0], ALPHA[1], X[x_col], X[x_col+1], ax_r, ax_i );
      Mset( ATL_sZERO, ATL_sZERO, dot_r, dot_i );

      a_off = a_col;
      x_off = 0;
      y_off = 0;
      for( row = 0; row < col; row++ )
      {
         Mmla( A[a_off], A[a_off+1], ax_r, ax_i, Y[y_off], Y[y_off+1] );
         Mmla( A[a_off], -A[a_off+1], X[x_off], X[x_off+1], dot_r, dot_i );
         a_off += 2;
         x_off += x_step;
         y_off += y_step;
      }
/*
 *    a_off now designates the pair following the last one used above;
 *    only its first component enters the update of Y(col).
 */
      Mset( Y[y_col] + A[a_off]*ax_r, Y[y_col+1] + A[a_off]*ax_i,
            Y[y_col], Y[y_col+1] );
      Mmla( ALPHA[0], ALPHA[1], dot_r, dot_i, Y[y_col], Y[y_col+1] );

/*
 *    Move to the next column first, then enlarge the column stride.
 */
      a_col  += a_step;
      a_step += 2;
      x_col  += x_step;
      y_col  += y_step;
   }
/*
 * End of ATL_crefhpmvU
 */
}
Пример #19
0
void ATL_zrefsymmLU
(
   const int                  M,
   const int                  N,
   const double               * ALPHA,
   const double               * A,
   const int                  LDA,
   const double               * B,
   const int                  LDB,
   const double               * BETA,
   double                     * C,
   const int                  LDC
)
{
/*
 * Purpose
 * =======
 *
 * ATL_zrefsymmLU( ... ) is the specialization
 *
 *    ATL_zrefsymm( AtlasLeft, AtlasUpper, ... )
 *
 * See ATL_zrefsymm for the argument description.
 *
 * Notes
 * =====
 *
 * A, B and C are addressed as arrays of double pairs: entry (r,c) of A
 * is read at A[2*r + 2*LDA*c], of B at B[2*r + 2*LDB*c], and of C at
 * C[2*r + 2*LDC*c].  Only entries (r,c) of A with r <= c are read.
 *
 * Each column j is processed independently,  rows from 0 up to M-1.
 * For row i, the first temporary is the Mmul of ALPHA and B(i,j) and
 * the second starts at zero.  Every k < i uses A(k,i) twice: combined
 * with the first temporary and added into the already scaled C(k,j),
 * and combined with B(k,j) and added into the second temporary.
 * C(i,j) is then passed to Mzelscal with BETA, receives the first
 * temporary combined with A(i,i), and finally ALPHA combined with the
 * second temporary.
 *
 * Mmul, Mset, Mmla and Mzelscal are macros defined outside this
 * routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register double            ab_i, ab_r, dot_i, dot_r;
   int                        col, row, p, a_col, a_kk, a_off, b_col,
                              b_ij, b_off, c_col, c_ij, c_off;
   const int                  a_step = 2 * LDA, b_step = 2 * LDB,
                              c_step = 2 * LDC;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;
      c_col = col * c_step;

      for( row = 0; row < M; row++ )
      {
         a_col = row * a_step;            /* start of column `row` of A  */
         b_ij  = b_col + 2 * row;         /* entry B(row,col)            */
         c_ij  = c_col + 2 * row;         /* entry C(row,col)            */

         Mmul( ALPHA[0], ALPHA[1], B[b_ij], B[b_ij+1], ab_r, ab_i );
         Mset( ATL_dZERO, ATL_dZERO, dot_r, dot_i );

         a_off = a_col;
         b_off = b_col;
         c_off = c_col;
         for( p = 0; p < row; p++ )
         {
            Mmla( A[a_off], A[a_off+1], ab_r, ab_i, C[c_off], C[c_off+1] );
            Mmla( B[b_off], B[b_off+1], A[a_off], A[a_off+1],
                  dot_r, dot_i );
            a_off += 2;
            b_off += 2;
            c_off += 2;
         }

         Mzelscal( BETA[0], BETA[1], C[c_ij], C[c_ij+1] );
         a_kk = a_col + 2 * row;          /* diagonal entry A(row,row)   */
         Mmla( ab_r, ab_i, A[a_kk], A[a_kk+1], C[c_ij], C[c_ij+1] );
         Mmla( ALPHA[0], ALPHA[1], dot_r, dot_i, C[c_ij], C[c_ij+1] );
      }
   }
/*
 * End of ATL_zrefsymmLU
 */
}
Пример #20
0
void ATL_crefgerc
(
   const int                  M,
   const int                  N,
   const float                * ALPHA,
   const float                * X,
   const int                  INCX,
   const float                * Y,
   const int                  INCY,
   float                      * A,
   const int                  LDA
)
{
/*
 * Purpose
 * =======
 *
 * ATL_crefgerc performs the rank 1 operation
 *
 *    A := alpha * x * conjg( y' ) + A,
 *
 * where alpha is a scalar,  x is an m-element vector, y is an n-element
 * vector and A is an m by n matrix.
 *
 * Arguments
 * =========
 *
 * M       (input)                       const int
 *         Number of rows of the matrix A.  M must be at least zero.
 *         Unchanged on exit.
 *
 * N       (input)                       const int
 *         Number of columns of the matrix A.  N must be at least zero.
 *         Unchanged on exit.
 *
 * ALPHA   (input)                       const float *
 *         The scalar alpha.  When ALPHA is supplied as zero the arrays
 *         X and Y need not be set on input.  Unchanged on exit.
 *
 * X       (input)                       const float *
 *         Points to the first entry to be accessed of an incremented
 *         array of size equal to or greater than
 *            ( 1 + ( m - 1 ) * abs( INCX ) ) * sizeof( float [2] ),
 *         that contains the vector x.  Unchanged on exit.
 *
 * INCX    (input)                       const int
 *         Increment for the elements of X.  INCX must not be zero.
 *         Unchanged on exit.
 *
 * Y       (input)                       const float *
 *         Points to the first entry to be accessed of an incremented
 *         array of size equal to or greater than
 *            ( 1 + ( n - 1 ) * abs( INCY ) ) * sizeof( float [2] ),
 *         that contains the vector y.  Unchanged on exit.
 *
 * INCY    (input)                       const int
 *         Increment for the elements of Y.  INCY must not be zero.
 *         Unchanged on exit.
 *
 * A       (input/output)                float *
 *         Points to an array of size equal to or greater than
 *         LDA * n * sizeof( float [2] ).  Before entry, the leading
 *         m by n part of the array A must contain the matrix
 *         coefficients.  On exit, A is overwritten by the updated
 *         matrix.
 *
 * LDA     (input)                       const int
 *         First dimension of A as declared in the calling (sub)
 *         program.  LDA must be at least max( 1, m ).  Unchanged on
 *         exit.
 *
 * Notes
 * =====
 *
 * The routine returns immediately when M or N is zero, or when Mszero
 * reports true for the two components of ALPHA.  Otherwise, for each
 * column j,  a temporary is formed by Mmul from ALPHA and the pair
 * Y(j) with negated second component, and every X(i) is combined with
 * it and added into A(i,j) by Mmla.
 *
 * Mszero, Mmul and Mmla are macros defined outside this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register float             ay_i, ay_r;
   int                        col, row, a_col = 0, a_off, x_off, y_off = 0;
   const int                  a_step = 2 * LDA, x_step = 2 * INCX,
                              y_step = 2 * INCY;
/* ..
 * .. Executable Statements ..
 *
 */
   if( M == 0 ) { return; }
   if( N == 0 ) { return; }
   if( Mszero( ALPHA[0], ALPHA[1] ) ) { return; }

   for( col = 0; col < N; col++ )
   {
      Mmul( ALPHA[0], ALPHA[1], Y[y_off], -Y[y_off+1], ay_r, ay_i );

      a_off = a_col;
      x_off = 0;
      for( row = 0; row < M; row++ )
      {
         Mmla( X[x_off], X[x_off+1], ay_r, ay_i, A[a_off], A[a_off+1] );
         a_off += 2;
         x_off += x_step;
      }
      a_col += a_step;
      y_off += y_step;
   }
/*
 * End of ATL_crefgerc
 */
}
Пример #21
0
void ATL_crefsymmLL
(
   const int                  M,
   const int                  N,
   const float                * ALPHA,
   const float                * A,
   const int                  LDA,
   const float                * B,
   const int                  LDB,
   const float                * BETA,
   float                      * C,
   const int                  LDC
)
{
/*
 * Purpose
 * =======
 *
 * ATL_crefsymmLL( ... ) is the specialization
 *
 *    ATL_crefsymm( AtlasLeft, AtlasLower, ... )
 *
 * See ATL_crefsymm for the argument description.
 *
 * Notes
 * =====
 *
 * A, B and C are addressed as arrays of float pairs: entry (r,c) of A
 * is read at A[2*r + 2*LDA*c], of B at B[2*r + 2*LDB*c], and of C at
 * C[2*r + 2*LDC*c].  Only entries (r,c) of A with r >= c are read.
 *
 * Each column j is processed independently,  rows from M-1 down to 0.
 * For row i, the first temporary is the Mmul of ALPHA and B(i,j) and
 * the second starts at zero.  Every k > i uses A(k,i) twice: combined
 * with the first temporary and added into the already scaled C(k,j),
 * and combined with B(k,j) and added into the second temporary.
 * C(i,j) is then passed to Mcelscal with BETA, receives the first
 * temporary combined with A(i,i), and finally ALPHA combined with the
 * second temporary.
 *
 * Mmul, Mset, Mmla and Mcelscal are macros defined outside this
 * routine.
 *
 * Offsets are formed by multiplication inside the loop bodies, so no
 * negative value is ever left-shifted when M is zero (the former
 * ( (M-1) << 1 ) was undefined behaviour in that case).
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   register float             ab_i, ab_r, dot_i, dot_r;
   int                        col, row, p, a_kk, a_off, b_col, b_ij,
                              b_off, c_col, c_ij, c_off;
   const int                  a_step = 2 * LDA, b_step = 2 * LDB,
                              c_step = 2 * LDC;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      b_col = col * b_step;
      c_col = col * c_step;

      for( row = M - 1; row >= 0; row-- )
      {
         a_kk = row * a_step + 2 * row;   /* diagonal entry A(row,row)   */
         b_ij = b_col + 2 * row;          /* entry B(row,col)            */
         c_ij = c_col + 2 * row;          /* entry C(row,col)            */

         Mmul( ALPHA[0], ALPHA[1], B[b_ij], B[b_ij+1], ab_r, ab_i );
         Mset( ATL_sZERO, ATL_sZERO, dot_r, dot_i );
/*
 *       Rows strictly below the diagonal of column `row` of A.
 */
         a_off = a_kk + 2;
         b_off = b_ij + 2;
         c_off = c_ij + 2;
         for( p = row + 1; p < M; p++ )
         {
            Mmla( A[a_off], A[a_off+1], ab_r, ab_i, C[c_off], C[c_off+1] );
            Mmla( B[b_off], B[b_off+1], A[a_off], A[a_off+1],
                  dot_r, dot_i );
            a_off += 2;
            b_off += 2;
            c_off += 2;
         }

         Mcelscal( BETA[0], BETA[1], C[c_ij], C[c_ij+1] );
         Mmla( ab_r, ab_i, A[a_kk], A[a_kk+1], C[c_ij], C[c_ij+1] );
         Mmla( ALPHA[0], ALPHA[1], dot_r, dot_i, C[c_ij], C[c_ij+1] );
      }
   }
/*
 * End of ATL_crefsymmLL
 */
}
Пример #22
0
void ATL_crefher2kUN
(
   const int                  N,
   const int                  K,
   const float                * ALPHA,
   const float                * A,
   const int                  LDA,
   const float                * B,
   const int                  LDB,
   const float                BETA,
   float                      * C,
   const int                  LDC
)
{
/*
 * Purpose
 * =======
 *
 * ATL_crefher2kUN( ... ) is the specialization
 *
 *    ATL_crefher2k( AtlasUpper, AtlasNoTrans, ... )
 *
 * See ATL_crefher2k for the argument description.
 *
 * Notes
 * =====
 *
 * A, B and C are addressed as arrays of float pairs: entry (r,c) of A
 * is read at A[2*r + 2*LDA*c], of B at B[2*r + 2*LDB*c], and of C at
 * C[2*r + 2*LDC*c].  BETA is a plain float, not a pair.
 *
 * For column j of C only rows 0..j are touched.  The 2*j floats above
 * the diagonal are passed to Msvscal with BETA; the first component of
 * the diagonal entry is passed to Mselscal with BETA and its second
 * component is set to zero.
 *
 * For each l < K two temporaries are formed by Mmul: one from ALPHA
 * and B(j,l) with negated second component, one from ALPHA with negated
 * second component and A(j,l) with negated second component.  Every
 * row above the diagonal receives two Mmla updates, A(i,l) with the
 * first temporary and B(i,l) with the second; the diagonal entry
 * receives only the first component of the combined update and has its
 * second component reset to zero.
 *
 * Msvscal, Mselscal, Mmul, Mmla and Mset are macros defined outside
 * this routine.
 *
 * ---------------------------------------------------------------------
 */
/*
 * .. Local Variables ..
 */
   float                      u_i, u_r, v_i, v_r;
   int                        col, row, p, a_jl, a_off, b_jl, b_off,
                              c_col, c_jj, c_off;
   const int                  a_step = 2 * LDA, b_step = 2 * LDB,
                              c_step = 2 * LDC;
/* ..
 * .. Executable Statements ..
 *
 */
   for( col = 0; col < N; col++ )
   {
      c_col = col * c_step;               /* start of column `col` of C  */
      c_jj  = c_col + 2 * col;            /* diagonal entry C(col,col)   */

      Msvscal( 2 * col, BETA, C + c_col, 1 );
      Mselscal( BETA, C[c_jj] );
      C[c_jj+1] = ATL_sZERO;

      for( p = 0; p < K; p++ )
      {
         a_jl = p * a_step + 2 * col;     /* entry A(col,p)              */
         b_jl = p * b_step + 2 * col;     /* entry B(col,p)              */

         Mmul( ALPHA[0],  ALPHA[1], B[b_jl], -B[b_jl+1], u_r, u_i );
         Mmul( ALPHA[0], -ALPHA[1], A[a_jl], -A[a_jl+1], v_r, v_i );
/*
 *       Rows strictly above the diagonal.
 */
         a_off = p * a_step;
         b_off = p * b_step;
         c_off = c_col;
         for( row = 0; row < col; row++ )
         {
            Mmla( A[a_off], A[a_off+1], u_r, u_i, C[c_off], C[c_off+1] );
            Mmla( B[b_off], B[b_off+1], v_r, v_i, C[c_off], C[c_off+1] );
            a_off += 2;
            b_off += 2;
            c_off += 2;
         }
/*
 *       Diagonal entry: first component updated, second forced to zero.
 */
         Mset( C[c_jj] + A[a_jl] * u_r - A[a_jl+1] * u_i +
                         B[b_jl] * v_r - B[b_jl+1] * v_i,
               ATL_sZERO, C[c_jj], C[c_jj+1] );
      }
   }
/*
 * End of ATL_crefher2kUN
 */
}