lapack_int LAPACKE_cuncsd_work( int matrix_layout, char jobu1, char jobu2, char jobv1t, char jobv2t, char trans, char signs, lapack_int m, lapack_int p, lapack_int q, lapack_complex_float* x11, lapack_int ldx11, lapack_complex_float* x12, lapack_int ldx12, lapack_complex_float* x21, lapack_int ldx21, lapack_complex_float* x22, lapack_int ldx22, float* theta, lapack_complex_float* u1, lapack_int ldu1, lapack_complex_float* u2, lapack_int ldu2, lapack_complex_float* v1t, lapack_int ldv1t, lapack_complex_float* v2t, lapack_int ldv2t, lapack_complex_float* work, lapack_int lwork, float* rwork, lapack_int lrwork, lapack_int* iwork ) { lapack_int info = 0; /* LAPACK function works with matrices in both layouts. It is supported * through TRANS parameter. So all conversion between layouts can be * completed in LAPACK function. See the table below which describes how * every LAPACKE call is forwarded to corresponding LAPACK call. * * matrix_layout | trans_LAPACKE | -> trans_LAPACK * | (trans) | (ltrans) * -----------------+---------------+---------------- * LAPACK_COL_MAJOR | 'N' | -> 'N' * LAPACK_COL_MAJOR | 'T' | -> 'T' * LAPACK_ROW_MAJOR | 'N' | -> 'T' * LAPACK_ROW_MAJOR | 'T' | -> 'T' * (note that for row major layout trans parameter is ignored) */ if( matrix_layout == LAPACK_COL_MAJOR || matrix_layout == LAPACK_ROW_MAJOR ) { char ltrans; if( !LAPACKE_lsame( trans, 't' ) && matrix_layout == LAPACK_COL_MAJOR ) { ltrans = 'n'; } else { ltrans = 't'; } /* Call LAPACK function and adjust info */ LAPACK_cuncsd( &jobu1, &jobu2, &jobv1t, &jobv2t, <rans, &signs, &m, &p, &q, x11, &ldx11, x12, &ldx12, x21, &ldx21, x22, &ldx22, theta, u1, &ldu1, u2, &ldu2, v1t, &ldv1t, v2t, &ldv2t, work, &lwork, rwork, &lrwork, iwork, &info ); if( info < 0 ) { info = info - 1; } } else { info = -1; LAPACKE_xerbla( "LAPACKE_cuncsd_work", info ); } return info; }
lapack_int LAPACKE_cuncsd_work( int matrix_order, char jobu1, char jobu2, char jobv1t, char jobv2t, char trans, char signs, lapack_int m, lapack_int p, lapack_int q, lapack_complex_float* x11, lapack_int ldx11, lapack_complex_float* x12, lapack_int ldx12, lapack_complex_float* x21, lapack_int ldx21, lapack_complex_float* x22, lapack_int ldx22, float* theta, lapack_complex_float* u1, lapack_int ldu1, lapack_complex_float* u2, lapack_int ldu2, lapack_complex_float* v1t, lapack_int ldv1t, lapack_complex_float* v2t, lapack_int ldv2t, lapack_complex_float* work, lapack_int lwork, float* rwork, lapack_int lrwork, lapack_int* iwork ) { lapack_int info = 0; if( matrix_order == LAPACK_COL_MAJOR ) { /* Call LAPACK function and adjust info */ LAPACK_cuncsd( &jobu1, &jobu2, &jobv1t, &jobv2t, &trans, &signs, &m, &p, &q, x11, &ldx11, x12, &ldx12, x21, &ldx21, x22, &ldx22, theta, u1, &ldu1, u2, &ldu2, v1t, &ldv1t, v2t, &ldv2t, work, &lwork, rwork, &lrwork, iwork, &info ); if( info < 0 ) { info = info - 1; } } else if( matrix_order == LAPACK_ROW_MAJOR ) { lapack_int nrows_x11 = ( LAPACKE_lsame( trans, 'n' ) ? p : q); lapack_int nrows_x12 = ( LAPACKE_lsame( trans, 'n' ) ? p : m-q); lapack_int nrows_x21 = ( LAPACKE_lsame( trans, 'n' ) ? m-p : q); lapack_int nrows_x22 = ( LAPACKE_lsame( trans, 'n' ) ? m-p : m-q); lapack_int nrows_u1 = ( LAPACKE_lsame( jobu1, 'y' ) ? p : 1); lapack_int nrows_u2 = ( LAPACKE_lsame( jobu2, 'y' ) ? m-p : 1); lapack_int nrows_v1t = ( LAPACKE_lsame( jobv1t, 'y' ) ? q : 1); lapack_int nrows_v2t = ( LAPACKE_lsame( jobv2t, 'y' ) ? m-q : 1); lapack_int ldu1_t = MAX(1,nrows_u1); lapack_int ldu2_t = MAX(1,nrows_u2); lapack_int ldv1t_t = MAX(1,nrows_v1t); lapack_int ldv2t_t = MAX(1,nrows_v2t); lapack_int ldx11_t = MAX(1,nrows_x11); lapack_int ldx12_t = MAX(1,nrows_x12); lapack_int ldx21_t = MAX(1,nrows_x21); lapack_int ldx22_t = MAX(1,nrows_x22); lapack_complex_float* x11_t = NULL; lapack_complex_float* x12_t = NULL; lapack_complex_float* x21_t = NULL; lapack_complex_float* x22_t = NULL; lapack_complex_float* u1_t = NULL; lapack_complex_float* u2_t = NULL; lapack_complex_float* v1t_t = NULL; lapack_complex_float* v2t_t = NULL; /* Check leading dimension(s) */ if( ldu1 < p ) { info = -21; LAPACKE_xerbla( "LAPACKE_cuncsd_work", info ); return info; } if( ldu2 < m-p ) { info = -23; LAPACKE_xerbla( "LAPACKE_cuncsd_work", info ); return info; } if( ldv1t < q ) { info = -25; LAPACKE_xerbla( "LAPACKE_cuncsd_work", info ); return info; } if( ldv2t < m-q ) { info = -27; LAPACKE_xerbla( "LAPACKE_cuncsd_work", info ); return info; } if( ldx11 < q ) { info = -12; LAPACKE_xerbla( "LAPACKE_cuncsd_work", info ); return info; } if( ldx12 < m-q ) { info = -14; LAPACKE_xerbla( "LAPACKE_cuncsd_work", info ); return info; } if( ldx21 < q ) { info = -16; LAPACKE_xerbla( "LAPACKE_cuncsd_work", info ); return info; } if( ldx22 < m-q ) { info = -18; LAPACKE_xerbla( "LAPACKE_cuncsd_work", info ); return info; } /* Query optimal working array(s) size if requested */ if( lrwork == -1 || lwork == -1 ) { LAPACK_cuncsd( &jobu1, &jobu2, &jobv1t, &jobv2t, &trans, &signs, &m, &p, &q, x11, &ldx11_t, x12, &ldx12_t, x21, &ldx21_t, x22, &ldx22_t, theta, u1, &ldu1_t, u2, &ldu2_t, v1t, &ldv1t_t, v2t, &ldv2t_t, work, &lwork, rwork, &lrwork, iwork, &info ); return (info < 0) ? (info - 1) : info; } /* Allocate memory for temporary array(s) */ x11_t = (lapack_complex_float*) LAPACKE_malloc( sizeof(lapack_complex_float) * ldx11_t * MAX(1,q) ); if( x11_t == NULL ) { info = LAPACK_TRANSPOSE_MEMORY_ERROR; goto exit_level_0; } x12_t = (lapack_complex_float*) LAPACKE_malloc( sizeof(lapack_complex_float) * ldx12_t * MAX(1,m-q) ); if( x12_t == NULL ) { info = LAPACK_TRANSPOSE_MEMORY_ERROR; goto exit_level_1; } x21_t = (lapack_complex_float*) LAPACKE_malloc( sizeof(lapack_complex_float) * ldx21_t * MAX(1,q) ); if( x21_t == NULL ) { info = LAPACK_TRANSPOSE_MEMORY_ERROR; goto exit_level_2; } x22_t = (lapack_complex_float*) LAPACKE_malloc( sizeof(lapack_complex_float) * ldx22_t * MAX(1,m-q) ); if( x22_t == NULL ) { info = LAPACK_TRANSPOSE_MEMORY_ERROR; goto exit_level_3; } if( LAPACKE_lsame( jobu1, 'y' ) ) { u1_t = (lapack_complex_float*) LAPACKE_malloc( sizeof(lapack_complex_float) * ldu1_t * MAX(1,p) ); if( u1_t == NULL ) { info = LAPACK_TRANSPOSE_MEMORY_ERROR; goto exit_level_4; } } if( LAPACKE_lsame( jobu2, 'y' ) ) { u2_t = (lapack_complex_float*) LAPACKE_malloc( sizeof(lapack_complex_float) * ldu2_t * MAX(1,m-p) ); if( u2_t == NULL ) { info = LAPACK_TRANSPOSE_MEMORY_ERROR; goto exit_level_5; } } if( LAPACKE_lsame( jobv1t, 'y' ) ) { v1t_t = (lapack_complex_float*) LAPACKE_malloc( sizeof(lapack_complex_float) * ldv1t_t * MAX(1,q) ); if( v1t_t == NULL ) { info = LAPACK_TRANSPOSE_MEMORY_ERROR; goto exit_level_6; } } if( LAPACKE_lsame( jobv2t, 'y' ) ) { v2t_t = (lapack_complex_float*) LAPACKE_malloc( sizeof(lapack_complex_float) * ldv2t_t * MAX(1,m-q) ); if( v2t_t == NULL ) { info = LAPACK_TRANSPOSE_MEMORY_ERROR; goto exit_level_7; } } /* Transpose input matrices */ LAPACKE_cge_trans( matrix_order, nrows_x11, q, x11, ldx11, x11_t, ldx11_t ); LAPACKE_cge_trans( matrix_order, nrows_x12, m-q, x12, ldx12, x12_t, ldx12_t ); LAPACKE_cge_trans( matrix_order, nrows_x21, q, x21, ldx21, x21_t, ldx21_t ); LAPACKE_cge_trans( matrix_order, nrows_x22, m-q, x22, ldx22, x22_t, ldx22_t ); /* Call LAPACK function and adjust info */ LAPACK_cuncsd( &jobu1, &jobu2, &jobv1t, &jobv2t, &trans, &signs, &m, &p, &q, x11_t, &ldx11_t, x12_t, &ldx12_t, x21_t, &ldx21_t, x22_t, &ldx22_t, theta, u1_t, &ldu1_t, u2_t, &ldu2_t, v1t_t, &ldv1t_t, v2t_t, &ldv2t_t, work, &lwork, rwork, &lrwork, iwork, &info ); if( info < 0 ) { info = info - 1; } /* Transpose output matrices */ LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_x11, q, x11_t, ldx11_t, x11, ldx11 ); LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_x12, m-q, x12_t, ldx12_t, x12, ldx12 ); LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_x21, q, x21_t, ldx21_t, x21, ldx21 ); LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_x22, m-q, x22_t, ldx22_t, x22, ldx22 ); if( LAPACKE_lsame( jobu1, 'y' ) ) { LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_u1, p, u1_t, ldu1_t, u1, ldu1 ); } if( LAPACKE_lsame( jobu2, 'y' ) ) { LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_u2, m-p, u2_t, ldu2_t, u2, ldu2 ); } if( LAPACKE_lsame( jobv1t, 'y' ) ) { LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_v1t, q, v1t_t, ldv1t_t, v1t, ldv1t ); } if( LAPACKE_lsame( jobv2t, 'y' ) ) { LAPACKE_cge_trans( LAPACK_COL_MAJOR, nrows_v2t, m-q, v2t_t, ldv2t_t, v2t, ldv2t ); } /* Release memory and exit */ if( LAPACKE_lsame( jobv2t, 'y' ) ) { LAPACKE_free( v2t_t ); } exit_level_7: if( LAPACKE_lsame( jobv1t, 'y' ) ) { LAPACKE_free( v1t_t ); } exit_level_6: if( LAPACKE_lsame( jobu2, 'y' ) ) { LAPACKE_free( u2_t ); } exit_level_5: if( LAPACKE_lsame( jobu1, 'y' ) ) { LAPACKE_free( u1_t ); } exit_level_4: LAPACKE_free( x22_t ); exit_level_3: LAPACKE_free( x21_t ); exit_level_2: LAPACKE_free( x12_t ); exit_level_1: LAPACKE_free( x11_t ); exit_level_0: if( info == LAPACK_TRANSPOSE_MEMORY_ERROR ) { LAPACKE_xerbla( "LAPACKE_cuncsd_work", info ); } } else { info = -1; LAPACKE_xerbla( "LAPACKE_cuncsd_work", info ); } return info; }