|
- /*****************************************************************************
- Copyright (c) 2014, Intel Corp.
- All rights reserved.
-
- Redistribution and use in source and binary forms, with or without
- modification, are permitted provided that the following conditions are met:
-
- * Redistributions of source code must retain the above copyright notice,
- this list of conditions and the following disclaimer.
- * Redistributions in binary form must reproduce the above copyright
- notice, this list of conditions and the following disclaimer in the
- documentation and/or other materials provided with the distribution.
- * Neither the name of Intel Corporation nor the names of its contributors
- may be used to endorse or promote products derived from this software
- without specific prior written permission.
-
- THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
- AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
- ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
- LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
- CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
- SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
- INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
- CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
- ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
- THE POSSIBILITY OF SUCH DAMAGE.
- *****************************************************************************
- * Contents: Native middle-level C interface to LAPACK function zuncsd2by1
- * Author: Intel Corporation
- *****************************************************************************/
-
- #include "lapacke_utils.h"
-
- lapack_int LAPACKE_zuncsd2by1_work( int matrix_layout, char jobu1, char jobu2,
- char jobv1t, lapack_int m, lapack_int p,
- lapack_int q, lapack_complex_double* x11, lapack_int ldx11,
- lapack_complex_double* x21, lapack_int ldx21,
- double* theta, lapack_complex_double* u1,
- lapack_int ldu1, lapack_complex_double* u2,
- lapack_int ldu2, lapack_complex_double* v1t,
- lapack_int ldv1t, lapack_complex_double* work,
- lapack_int lwork, double* rwork, lapack_int lrwork,
- lapack_int* iwork )
- {
- lapack_int info = 0;
- if( matrix_layout == LAPACK_COL_MAJOR ) {
- /* Call LAPACK function and adjust info */
- LAPACK_zuncsd2by1( &jobu1, &jobu2, &jobv1t, &m, &p,
- &q, x11, &ldx11, x21, &ldx21,
- theta, u1, &ldu1, u2, &ldu2, v1t, &ldv1t,
- work, &lwork, rwork, &lrwork, iwork, &info );
- if( info < 0 ) {
- info = info - 1;
- }
- } else if( matrix_layout == LAPACK_ROW_MAJOR ) {
- lapack_int nrows_x11 = p;
- lapack_int nrows_x21 = m-p;
- lapack_int nrows_u1 = ( LAPACKE_lsame( jobu1, 'y' ) ? p : 1);
- lapack_int nrows_u2 = ( LAPACKE_lsame( jobu2, 'y' ) ? m-p : 1);
- lapack_int nrows_v1t = ( LAPACKE_lsame( jobv1t, 'y' ) ? q : 1);
- lapack_int ldu1_t = MAX(1,nrows_u1);
- lapack_int ldu2_t = MAX(1,nrows_u2);
- lapack_int ldv1t_t = MAX(1,nrows_v1t);
- lapack_int ldx11_t = MAX(1,nrows_x11);
- lapack_int ldx21_t = MAX(1,nrows_x21);
- lapack_complex_double* x11_t = NULL;
- lapack_complex_double* x21_t = NULL;
- lapack_complex_double* u1_t = NULL;
- lapack_complex_double* u2_t = NULL;
- lapack_complex_double* v1t_t = NULL;
- /* Check leading dimension(s) */
- if( ldu1 < p ) {
- info = -21;
- LAPACKE_xerbla( "LAPACKE_zuncsd2by1_work", info );
- return info;
- }
- if( ldu2 < m-p ) {
- info = -23;
- LAPACKE_xerbla( "LAPACKE_zuncsd2by1_work", info );
- return info;
- }
- if( ldv1t < q ) {
- info = -25;
- LAPACKE_xerbla( "LAPACKE_zuncsd2by1_work", info );
- return info;
- }
- if( ldx11 < q ) {
- info = -12;
- LAPACKE_xerbla( "LAPACKE_zuncsd2by1_work", info );
- return info;
- }
- if( ldx21 < q ) {
- info = -16;
- LAPACKE_xerbla( "LAPACKE_zuncsd2by1_work", info );
- return info;
- }
- /* Query optimal working array(s) size if requested */
- if( lrwork == -1 || lwork == -1 ) {
- LAPACK_zuncsd2by1( &jobu1, &jobu2, &jobv1t, &m, &p,
- &q, x11, &ldx11_t, x21, &ldx21_t,
- theta, u1, &ldu1_t, u2, &ldu2_t, v1t, &ldv1t_t,
- work, &lwork, rwork, &lrwork, iwork, &info );
- return (info < 0) ? (info - 1) : info;
- }
- /* Allocate memory for temporary array(s) */
- x11_t = (lapack_complex_double*)LAPACKE_malloc( sizeof(lapack_complex_double) * ldx11_t * MAX(1,q) );
- if( x11_t == NULL ) {
- info = LAPACK_TRANSPOSE_MEMORY_ERROR;
- goto exit_level_0;
- }
- x21_t = (lapack_complex_double*)LAPACKE_malloc( sizeof(lapack_complex_double) * ldx21_t * MAX(1,q) );
- if( x21_t == NULL ) {
- info = LAPACK_TRANSPOSE_MEMORY_ERROR;
- goto exit_level_1;
- }
- if( LAPACKE_lsame( jobu1, 'y' ) ) {
- u1_t = (lapack_complex_double*)
- LAPACKE_malloc( sizeof(lapack_complex_double) * ldu1_t * MAX(1,p) );
- if( u1_t == NULL ) {
- info = LAPACK_TRANSPOSE_MEMORY_ERROR;
- goto exit_level_2;
- }
- }
- if( LAPACKE_lsame( jobu2, 'y' ) ) {
- u2_t = (lapack_complex_double*)
- LAPACKE_malloc( sizeof(lapack_complex_double) * ldu2_t * MAX(1,m-p) );
- if( u2_t == NULL ) {
- info = LAPACK_TRANSPOSE_MEMORY_ERROR;
- goto exit_level_3;
- }
- }
- if( LAPACKE_lsame( jobv1t, 'y' ) ) {
- v1t_t = (lapack_complex_double*)
- LAPACKE_malloc( sizeof(lapack_complex_double) * ldv1t_t * MAX(1,q) );
- if( v1t_t == NULL ) {
- info = LAPACK_TRANSPOSE_MEMORY_ERROR;
- goto exit_level_4;
- }
- }
- /* Transpose input matrices */
- LAPACKE_zge_trans( matrix_layout, nrows_x11, q, x11, ldx11, x11_t,
- ldx11_t );
- LAPACKE_zge_trans( matrix_layout, nrows_x21, q, x21, ldx21, x21_t,
- ldx21_t );
- /* Call LAPACK function and adjust info */
- LAPACK_zuncsd2by1( &jobu1, &jobu2, &jobv1t, &m, &p,
- &q, x11_t, &ldx11_t, x21_t, &ldx21_t,
- theta, u1_t, &ldu1_t, u2_t, &ldu2_t, v1t_t, &ldv1t_t,
- work, &lwork, rwork, &lrwork, iwork, &info );
- if( info < 0 ) {
- info = info - 1;
- }
- /* Transpose output matrices */
- LAPACKE_zge_trans( LAPACK_COL_MAJOR, nrows_x11, q, x11_t, ldx11_t, x11,
- ldx11 );
- LAPACKE_zge_trans( LAPACK_COL_MAJOR, nrows_x21, q, x21_t, ldx21_t, x21,
- ldx21 );
- if( LAPACKE_lsame( jobu1, 'y' ) ) {
- LAPACKE_zge_trans( LAPACK_COL_MAJOR, nrows_u1, p, u1_t, ldu1_t, u1,
- ldu1 );
- }
- if( LAPACKE_lsame( jobu2, 'y' ) ) {
- LAPACKE_zge_trans( LAPACK_COL_MAJOR, nrows_u2, m-p, u2_t, ldu2_t,
- u2, ldu2 );
- }
- if( LAPACKE_lsame( jobv1t, 'y' ) ) {
- LAPACKE_zge_trans( LAPACK_COL_MAJOR, nrows_v1t, q, v1t_t, ldv1t_t,
- v1t, ldv1t );
- }
- /* Release memory and exit */
- if( LAPACKE_lsame( jobv1t, 'y' ) ) {
- LAPACKE_free( v1t_t );
- }
- exit_level_4:
- if( LAPACKE_lsame( jobu2, 'y' ) ) {
- LAPACKE_free( u2_t );
- }
- exit_level_3:
- if( LAPACKE_lsame( jobu1, 'y' ) ) {
- LAPACKE_free( u1_t );
- }
- exit_level_2:
- LAPACKE_free( x21_t );
- exit_level_1:
- LAPACKE_free( x11_t );
- exit_level_0:
- if( info == LAPACK_TRANSPOSE_MEMORY_ERROR ) {
- LAPACKE_xerbla( "LAPACKE_zuncsd2by1_work", info );
- }
- } else {
- info = -1;
- LAPACKE_xerbla( "LAPACKE_zuncsd2by1_work", info );
- }
- return info;
- }
|