00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013
00014
00015
00016
00017
00018
00019
00020
00021
00022
00023
00024
00025
00026
00027
00028
00029
00030
00031
00032
00033
00034
00035
00036
00037
00038
00039
00040
00041
00042
00043
00044
00045
00046
00047
00048
00049 #include <stdio.h>
00050 #include "lapacke.h"
00051 #include "lapacke_utils.h"
00052 #include "test_utils.h"
00053
00054 static void init_scalars_cunmqr( char *side, char *trans, lapack_int *m,
00055 lapack_int *n, lapack_int *k, lapack_int *lda,
00056 lapack_int *ldc, lapack_int *lwork );
00057 static void init_a( lapack_int size, lapack_complex_float *a );
00058 static void init_tau( lapack_int size, lapack_complex_float *tau );
00059 static void init_c( lapack_int size, lapack_complex_float *c );
00060 static void init_work( lapack_int size, lapack_complex_float *work );
00061 static int compare_cunmqr( lapack_complex_float *c, lapack_complex_float *c_i,
00062 lapack_int info, lapack_int info_i, lapack_int ldc,
00063 lapack_int n );
00064
00065 int main(void)
00066 {
00067
00068 char side, side_i;
00069 char trans, trans_i;
00070 lapack_int m, m_i;
00071 lapack_int n, n_i;
00072 lapack_int k, k_i;
00073 lapack_int lda, lda_i;
00074 lapack_int lda_r;
00075 lapack_int ldc, ldc_i;
00076 lapack_int ldc_r;
00077 lapack_int lwork, lwork_i;
00078 lapack_int info, info_i;
00079
00080 lapack_int r;
00081 lapack_int i;
00082 int failed;
00083
00084
00085 lapack_complex_float *a = NULL, *a_i = NULL;
00086 lapack_complex_float *tau = NULL, *tau_i = NULL;
00087 lapack_complex_float *c = NULL, *c_i = NULL;
00088 lapack_complex_float *work = NULL, *work_i = NULL;
00089 lapack_complex_float *c_save = NULL;
00090 lapack_complex_float *a_r = NULL;
00091 lapack_complex_float *c_r = NULL;
00092
00093
00094 init_scalars_cunmqr( &side, &trans, &m, &n, &k, &lda, &ldc, &lwork );
00095 r = LAPACKE_lsame( side, 'l' ) ? m : n;
00096 lda_r = k+2;
00097 ldc_r = n+2;
00098 side_i = side;
00099 trans_i = trans;
00100 m_i = m;
00101 n_i = n;
00102 k_i = k;
00103 lda_i = lda;
00104 ldc_i = ldc;
00105 lwork_i = lwork;
00106
00107
00108 a = (lapack_complex_float *)
00109 LAPACKE_malloc( lda*k * sizeof(lapack_complex_float) );
00110 tau = (lapack_complex_float *)
00111 LAPACKE_malloc( k * sizeof(lapack_complex_float) );
00112 c = (lapack_complex_float *)
00113 LAPACKE_malloc( ldc*n * sizeof(lapack_complex_float) );
00114 work = (lapack_complex_float *)
00115 LAPACKE_malloc( lwork * sizeof(lapack_complex_float) );
00116
00117
00118 a_i = (lapack_complex_float *)
00119 LAPACKE_malloc( lda*k * sizeof(lapack_complex_float) );
00120 tau_i = (lapack_complex_float *)
00121 LAPACKE_malloc( k * sizeof(lapack_complex_float) );
00122 c_i = (lapack_complex_float *)
00123 LAPACKE_malloc( ldc*n * sizeof(lapack_complex_float) );
00124 work_i = (lapack_complex_float *)
00125 LAPACKE_malloc( lwork * sizeof(lapack_complex_float) );
00126
00127
00128 c_save = (lapack_complex_float *)
00129 LAPACKE_malloc( ldc*n * sizeof(lapack_complex_float) );
00130
00131
00132 a_r = (lapack_complex_float *)
00133 LAPACKE_malloc( r*(k+2) * sizeof(lapack_complex_float) );
00134 c_r = (lapack_complex_float *)
00135 LAPACKE_malloc( m*(n+2) * sizeof(lapack_complex_float) );
00136
00137
00138 init_a( lda*k, a );
00139 init_tau( k, tau );
00140 init_c( ldc*n, c );
00141 init_work( lwork, work );
00142
00143
00144 for( i = 0; i < ldc*n; i++ ) {
00145 c_save[i] = c[i];
00146 }
00147
00148
00149 cunmqr_( &side, &trans, &m, &n, &k, a, &lda, tau, c, &ldc, work, &lwork,
00150 &info );
00151
00152
00153
00154 for( i = 0; i < lda*k; i++ ) {
00155 a_i[i] = a[i];
00156 }
00157 for( i = 0; i < k; i++ ) {
00158 tau_i[i] = tau[i];
00159 }
00160 for( i = 0; i < ldc*n; i++ ) {
00161 c_i[i] = c_save[i];
00162 }
00163 for( i = 0; i < lwork; i++ ) {
00164 work_i[i] = work[i];
00165 }
00166 info_i = LAPACKE_cunmqr_work( LAPACK_COL_MAJOR, side_i, trans_i, m_i, n_i,
00167 k_i, a_i, lda_i, tau_i, c_i, ldc_i, work_i,
00168 lwork_i );
00169
00170 failed = compare_cunmqr( c, c_i, info, info_i, ldc, n );
00171 if( failed == 0 ) {
00172 printf( "PASSED: column-major middle-level interface to cunmqr\n" );
00173 } else {
00174 printf( "FAILED: column-major middle-level interface to cunmqr\n" );
00175 }
00176
00177
00178
00179 for( i = 0; i < lda*k; i++ ) {
00180 a_i[i] = a[i];
00181 }
00182 for( i = 0; i < k; i++ ) {
00183 tau_i[i] = tau[i];
00184 }
00185 for( i = 0; i < ldc*n; i++ ) {
00186 c_i[i] = c_save[i];
00187 }
00188 for( i = 0; i < lwork; i++ ) {
00189 work_i[i] = work[i];
00190 }
00191 info_i = LAPACKE_cunmqr( LAPACK_COL_MAJOR, side_i, trans_i, m_i, n_i, k_i,
00192 a_i, lda_i, tau_i, c_i, ldc_i );
00193
00194 failed = compare_cunmqr( c, c_i, info, info_i, ldc, n );
00195 if( failed == 0 ) {
00196 printf( "PASSED: column-major high-level interface to cunmqr\n" );
00197 } else {
00198 printf( "FAILED: column-major high-level interface to cunmqr\n" );
00199 }
00200
00201
00202
00203 for( i = 0; i < lda*k; i++ ) {
00204 a_i[i] = a[i];
00205 }
00206 for( i = 0; i < k; i++ ) {
00207 tau_i[i] = tau[i];
00208 }
00209 for( i = 0; i < ldc*n; i++ ) {
00210 c_i[i] = c_save[i];
00211 }
00212 for( i = 0; i < lwork; i++ ) {
00213 work_i[i] = work[i];
00214 }
00215
00216 LAPACKE_cge_trans( LAPACK_COL_MAJOR, r, k, a_i, lda, a_r, k+2 );
00217 LAPACKE_cge_trans( LAPACK_COL_MAJOR, m, n, c_i, ldc, c_r, n+2 );
00218 info_i = LAPACKE_cunmqr_work( LAPACK_ROW_MAJOR, side_i, trans_i, m_i, n_i,
00219 k_i, a_r, lda_r, tau_i, c_r, ldc_r, work_i,
00220 lwork_i );
00221
00222 LAPACKE_cge_trans( LAPACK_ROW_MAJOR, m, n, c_r, n+2, c_i, ldc );
00223
00224 failed = compare_cunmqr( c, c_i, info, info_i, ldc, n );
00225 if( failed == 0 ) {
00226 printf( "PASSED: row-major middle-level interface to cunmqr\n" );
00227 } else {
00228 printf( "FAILED: row-major middle-level interface to cunmqr\n" );
00229 }
00230
00231
00232
00233 for( i = 0; i < lda*k; i++ ) {
00234 a_i[i] = a[i];
00235 }
00236 for( i = 0; i < k; i++ ) {
00237 tau_i[i] = tau[i];
00238 }
00239 for( i = 0; i < ldc*n; i++ ) {
00240 c_i[i] = c_save[i];
00241 }
00242 for( i = 0; i < lwork; i++ ) {
00243 work_i[i] = work[i];
00244 }
00245
00246
00247 LAPACKE_cge_trans( LAPACK_COL_MAJOR, r, k, a_i, lda, a_r, k+2 );
00248 LAPACKE_cge_trans( LAPACK_COL_MAJOR, m, n, c_i, ldc, c_r, n+2 );
00249 info_i = LAPACKE_cunmqr( LAPACK_ROW_MAJOR, side_i, trans_i, m_i, n_i, k_i,
00250 a_r, lda_r, tau_i, c_r, ldc_r );
00251
00252 LAPACKE_cge_trans( LAPACK_ROW_MAJOR, m, n, c_r, n+2, c_i, ldc );
00253
00254 failed = compare_cunmqr( c, c_i, info, info_i, ldc, n );
00255 if( failed == 0 ) {
00256 printf( "PASSED: row-major high-level interface to cunmqr\n" );
00257 } else {
00258 printf( "FAILED: row-major high-level interface to cunmqr\n" );
00259 }
00260
00261
00262 if( a != NULL ) {
00263 LAPACKE_free( a );
00264 }
00265 if( a_i != NULL ) {
00266 LAPACKE_free( a_i );
00267 }
00268 if( a_r != NULL ) {
00269 LAPACKE_free( a_r );
00270 }
00271 if( tau != NULL ) {
00272 LAPACKE_free( tau );
00273 }
00274 if( tau_i != NULL ) {
00275 LAPACKE_free( tau_i );
00276 }
00277 if( c != NULL ) {
00278 LAPACKE_free( c );
00279 }
00280 if( c_i != NULL ) {
00281 LAPACKE_free( c_i );
00282 }
00283 if( c_r != NULL ) {
00284 LAPACKE_free( c_r );
00285 }
00286 if( c_save != NULL ) {
00287 LAPACKE_free( c_save );
00288 }
00289 if( work != NULL ) {
00290 LAPACKE_free( work );
00291 }
00292 if( work_i != NULL ) {
00293 LAPACKE_free( work_i );
00294 }
00295
00296 return 0;
00297 }
00298
00299
00300 static void init_scalars_cunmqr( char *side, char *trans, lapack_int *m,
00301 lapack_int *n, lapack_int *k, lapack_int *lda,
00302 lapack_int *ldc, lapack_int *lwork )
00303 {
00304 *side = 'L';
00305 *trans = 'C';
00306 *m = 6;
00307 *n = 2;
00308 *k = 4;
00309 *lda = 8;
00310 *ldc = 8;
00311 *lwork = 512;
00312
00313 return;
00314 }
00315
00316
00317 static void init_a( lapack_int size, lapack_complex_float *a ) {
00318 lapack_int i;
00319 for( i = 0; i < size; i++ ) {
00320 a[i] = lapack_make_complex_float( 0.0f, 0.0f );
00321 }
00322 a[0] = lapack_make_complex_float( -3.087005138e+000, 0.000000000e+000 );
00323 a[8] = lapack_make_complex_float( -4.884994030e-001, -1.141689062e+000 );
00324 a[16] = lapack_make_complex_float( 3.773559928e-001, -1.243729830e+000 );
00325 a[24] = lapack_make_complex_float( -8.551653028e-001, -7.073198557e-001 );
00326 a[1] = lapack_make_complex_float( -3.269784153e-001, 4.238066077e-001 );
00327 a[9] = lapack_make_complex_float( 1.516316056e+000, 0.000000000e+000 );
00328 a[17] = lapack_make_complex_float( 1.373054981e+000, -8.176293373e-001 );
00329 a[25] = lapack_make_complex_float( -2.508625686e-001, 8.203486204e-001 );
00330 a[2] = lapack_make_complex_float( 1.691724658e-001, -7.980476320e-002 );
00331 a[10] = lapack_make_complex_float( -4.537104368e-001, -6.491497159e-003 );
00332 a[18] = lapack_make_complex_float( -2.171345234e+000, 0.000000000e+000 );
00333 a[26] = lapack_make_complex_float( -2.272676229e-001, -2.957314849e-001 );
00334 a[3] = lapack_make_complex_float( -1.059736237e-001, 7.268618047e-002 );
00335 a[11] = lapack_make_complex_float( -2.734071612e-001, 9.780790657e-002 );
00336 a[19] = lapack_make_complex_float( -2.918227613e-001, 4.888080955e-001 );
00337 a[27] = lapack_make_complex_float( -2.353376150e+000, 0.000000000e+000 );
00338 a[4] = lapack_make_complex_float( 1.729396135e-001, 1.606326252e-001 );
00339 a[12] = lapack_make_complex_float( -3.236304522e-001, 1.230006963e-001 );
00340 a[20] = lapack_make_complex_float( 2.727684677e-001, 4.697696120e-002 );
00341 a[28] = lapack_make_complex_float( 7.054226995e-001, 2.515080869e-001 );
00342 a[5] = lapack_make_complex_float( 2.698996663e-001, -1.516707987e-002 );
00343 a[13] = lapack_make_complex_float( -1.645935327e-001, 3.389006853e-001 );
00344 a[21] = lapack_make_complex_float( 5.348393917e-001, 3.988290727e-001 );
00345 a[29] = lapack_make_complex_float( 2.703070045e-001, -7.268778235e-002 );
00346 }
00347 static void init_tau( lapack_int size, lapack_complex_float *tau ) {
00348 lapack_int i;
00349 for( i = 0; i < size; i++ ) {
00350 tau[i] = lapack_make_complex_float( 0.0f, 0.0f );
00351 }
00352 tau[0] = lapack_make_complex_float( 1.310981035e+000, -2.623902261e-001 );
00353 tau[1] = lapack_make_complex_float( 1.105103970e+000, -4.503625035e-001 );
00354 tau[2] = lapack_make_complex_float( 1.040251970e+000, 2.121757567e-001 );
00355 tau[3] = lapack_make_complex_float( 1.185958982e+000, 2.011836171e-001 );
00356 }
00357 static void init_c( lapack_int size, lapack_complex_float *c ) {
00358 lapack_int i;
00359 for( i = 0; i < size; i++ ) {
00360 c[i] = lapack_make_complex_float( 0.0f, 0.0f );
00361 }
00362 c[0] = lapack_make_complex_float( -1.539999962e+000, 7.599999905e-001 );
00363 c[8] = lapack_make_complex_float( 3.170000076e+000, -2.089999914e+000 );
00364 c[1] = lapack_make_complex_float( 1.199999973e-001, -1.919999957e+000 );
00365 c[9] = lapack_make_complex_float( -6.530000210e+000, 4.179999828e+000 );
00366 c[2] = lapack_make_complex_float( -9.079999924e+000, -4.309999943e+000 );
00367 c[10] = lapack_make_complex_float( 7.280000210e+000, 7.300000191e-001 );
00368 c[3] = lapack_make_complex_float( 7.489999771e+000, 3.650000095e+000 );
00369 c[11] = lapack_make_complex_float( 9.100000262e-001, -3.970000029e+000 );
00370 c[4] = lapack_make_complex_float( -5.630000114e+000, -2.119999886e+000 );
00371 c[12] = lapack_make_complex_float( -5.460000038e+000, -1.639999986e+000 );
00372 c[5] = lapack_make_complex_float( 2.369999886e+000, 8.029999733e+000 );
00373 c[13] = lapack_make_complex_float( -2.839999914e+000, -5.860000134e+000 );
00374 }
00375 static void init_work( lapack_int size, lapack_complex_float *work ) {
00376 lapack_int i;
00377 for( i = 0; i < size; i++ ) {
00378 work[i] = lapack_make_complex_float( 0.0f, 0.0f );
00379 }
00380 }
00381
00382
00383
00384 static int compare_cunmqr( lapack_complex_float *c, lapack_complex_float *c_i,
00385 lapack_int info, lapack_int info_i, lapack_int ldc,
00386 lapack_int n )
00387 {
00388 lapack_int i;
00389 int failed = 0;
00390 for( i = 0; i < ldc*n; i++ ) {
00391 failed += compare_complex_floats(c[i],c_i[i]);
00392 }
00393 failed += (info == info_i) ? 0 : 1;
00394 if( info != 0 || info_i != 0 ) {
00395 printf( "info=%d, info_i=%d\n",(int)info,(int)info_i );
00396 }
00397
00398 return failed;
00399 }