00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013 #include "f2c.h"
00014 #include "blaswrap.h"
00015
00016
00017 /* Constants kept in static storage so that their addresses can be passed to the pointer-taking routines called from sporfs_ */
00018 static integer c__1 = 1; /* used as vector increment and as the single right-hand-side count given to spotrs_ */
00019 static real c_b12 = -1.f; /* passed to ssymv_ as its first scalar argument */
00020 static real c_b14 = 1.f; /* passed to ssymv_ as its second scalar argument and to saxpy_ as its scalar */
00021
00022 int sporfs_(char *uplo, integer *n, integer *nrhs, real *a,
00023 integer *lda, real *af, integer *ldaf, real *b, integer *ldb, real *x,
00024 integer *ldx, real *ferr, real *berr, real *work, integer *iwork,
00025 integer *info)
00026 {
00027 /* f2c-style scratch variables: leading dimensions, index offsets, loop bounds and expression temporaries */
00028 integer a_dim1, a_offset, af_dim1, af_offset, b_dim1, b_offset, x_dim1,
00029 x_offset, i__1, i__2, i__3;
00030 real r__1, r__2, r__3;
00031
00032 /* Local variables and prototypes of the external helper routines */
00033 integer i__, j, k;
00034 real s, xk;
00035 integer nz;
00036 real eps;
00037 integer kase;
00038 real safe1, safe2;
00039 extern logical lsame_(char *, char *);
00040 integer isave[3], count;
00041 logical upper;
00042 extern int scopy_(integer *, real *, integer *, real *,
00043 integer *), saxpy_(integer *, real *, real *, integer *, real *,
00044 integer *), ssymv_(char *, integer *, real *, real *, integer *,
00045 real *, integer *, real *, real *, integer *), slacn2_(
00046 integer *, real *, real *, integer *, real *, integer *, integer *
00047 );
00048 extern doublereal slamch_(char *);
00049 real safmin;
00050 extern int xerbla_(char *, integer *);
00051 real lstres;
00052 extern int spotrs_(char *, integer *, integer *, real *,
00053 integer *, real *, integer *, integer *);
00054
00055 /* Purpose */
00056 /* ------- */
00057 /* For each column j = 1..*nrhs of b and x this routine: */
00058 /*   1. forms the residual r = b(:,j) - A*x(:,j) in work[n+1..2n] (scopy_, then ssymv_ called with */
00059 /*      scalars -1 and 1; per the BLAS ssymv contract y := alpha*A*x + beta*y); */
00060 /*   2. sets berr[j] = max_i |r_i| / (|b(:,j)| + |A|*|x(:,j)|)_i, reading only the triangle of a chosen by uplo; */
00061 /*   3. if berr[j] > eps, berr[j] is at most half its previous value and count <= 5 (at most five */
00062 /*      corrections per column), solves for a correction with spotrs_ using af, adds it to x(:,j) */
00063 /*      with saxpy_ and goes back to step 1; */
00064 /*   4. obtains a forward error estimate from slacn2_ and stores it in ferr[j], divided by */
00065 /*      max_i |x(i,j)| whenever that maximum is nonzero. */
00066 /* NOTE(review): this appears to be the f2c translation of LAPACK's SPORFS (refinement and error bounds */
00067 /* for a symmetric positive definite system) - confirm against the LAPACK documentation. */
00068
00069 /* Arguments */
00070 /* --------- */
00071 /* uplo   (in)      must satisfy lsame_(uplo, "U") or lsame_(uplo, "L"); selects the upper or lower triangle */
00072 /*                  of a read below and is forwarded to ssymv_ and spotrs_. */
00073 /* n      (in)      order of the system; *n >= 0. */
00074 /* nrhs   (in)      number of columns of b and x to process; *nrhs >= 0. */
00075 /* a, lda (in)      matrix A addressed as a[i + k * lda] with 1-based i, k; *lda >= max(1,*n). */
00076 /* af, ldaf (in)    handed unchanged to spotrs_ (presumably the Cholesky factor of A - confirm); *ldaf >= max(1,*n). */
00077 /* b, ldb (in)      right-hand side columns; *ldb >= max(1,*n). */
00078 /* x, ldx (in/out)  solution columns, updated in place by the refinement step; *ldx >= max(1,*n). */
00079 /* ferr   (out)     ferr[j] receives the forward error estimate for column j. */
00080 /* berr   (out)     berr[j] receives the backward error for column j. */
00081 /* work   (scratch) used as work[1..n] (weights), work[n+1..2n] (residual / estimator vector) and */
00082 /*                  work[2n+1..] (given to slacn2_), so presumably at least 3*n elements - confirm. */
00083 /* iwork  (scratch) only passed to slacn2_; required length not visible here (presumably n - confirm). */
00084 /* info   (out)     0 when the arguments are valid, otherwise -k where k is the position of the first invalid */
00085 /*                  argument (xerbla_ is called with k before returning). info is also handed to spotrs_ as */
00086 /*                  its status argument and is not re-checked afterwards. */
00087
00088 /* The function's own return value is always 0. */
00089
00090
00091
00092
00093
00094
00095
00096
00097
00098
00099
00100
00101
00102
00103
00104
00105
00106
00107
00108
00109
00110
00111
00112
00113
00114
00115
00116
00117
00118
00119
00120
00121
00122
00123
00124
00125
00126
00127
00128
00129
00130
00131
00132
00133
00134
00135
00136
00137
00138
00139
00140
00141
00142
00143
00144
00145
00146
00147
00148
00149
00150
00151
00152
00153
00154
00155
00156
00157
00158
00159
00160
00161
00162
00163
00164
00165
00166
00167 /* Parameter adjustments: shift every array pointer so that the 1-based, column-major index expressions below can be used directly */
00168 a_dim1 = *lda;
00169 a_offset = 1 + a_dim1;
00170 a -= a_offset;
00171 af_dim1 = *ldaf;
00172 af_offset = 1 + af_dim1;
00173 af -= af_offset;
00174 b_dim1 = *ldb;
00175 b_offset = 1 + b_dim1;
00176 b -= b_offset;
00177 x_dim1 = *ldx;
00178 x_offset = 1 + x_dim1;
00179 x -= x_offset;
00180 --ferr;
00181 --berr;
00182 --work;
00183 --iwork;
00184
00185 /* Validate the arguments; the first failing test sets *info to minus that argument's position in the parameter list */
00186 *info = 0;
00187 upper = lsame_(uplo, "U");
00188 if (! upper && ! lsame_(uplo, "L")) {
00189 *info = -1;
00190 } else if (*n < 0) {
00191 *info = -2;
00192 } else if (*nrhs < 0) {
00193 *info = -3;
00194 } else if (*lda < max(1,*n)) {
00195 *info = -5;
00196 } else if (*ldaf < max(1,*n)) {
00197 *info = -7;
00198 } else if (*ldb < max(1,*n)) {
00199 *info = -9;
00200 } else if (*ldx < max(1,*n)) {
00201 *info = -11;
00202 }
00203 if (*info != 0) {
00204 i__1 = -(*info);
00205 xerbla_("SPORFS", &i__1);
00206 return 0;
00207 }
00208
00209
00210 /* Quick return when there is nothing to solve: every error entry for the *nrhs columns is set to zero */
00211 if (*n == 0 || *nrhs == 0) {
00212 i__1 = *nrhs;
00213 for (j = 1; j <= i__1; ++j) {
00214 ferr[j] = 0.f;
00215 berr[j] = 0.f;
00216
00217 }
00218 return 0;
00219 }
00220
00221
00222 /* nz = n + 1 scales the rounding terms below; safe1 = nz * safmin and safe2 = safe1 / eps are the small-denominator thresholds */
00223 nz = *n + 1;
00224 eps = slamch_("Epsilon");
00225 safmin = slamch_("Safe minimum");
00226 safe1 = nz * safmin;
00227 safe2 = safe1 / eps;
00228
00229
00230 /* Process the right-hand sides one column at a time */
00231 i__1 = *nrhs;
00232 for (j = 1; j <= i__1; ++j) {
00233 /* count numbers the current refinement pass; lstres holds the berr of the previous pass and is seeded with 3 */
00234 count = 1;
00235 lstres = 3.f;
00236 L20:
00237 /* Start of one refinement pass (target of the goto L20 further down) */
00238
00239
00240
00241 /* Residual: copy b(:,j) into work[n+1..2n], then let ssymv_ combine it with A*x(:,j) using scalars -1 and 1 */
00242 scopy_(n, &b[j * b_dim1 + 1], &c__1, &work[*n + 1], &c__1);
00243 ssymv_(uplo, n, &c_b12, &a[a_offset], lda, &x[j * x_dim1 + 1], &c__1,
00244 &c_b14, &work[*n + 1], &c__1);
00245
00246 /* Componentwise backward error for this column: */
00247 /*     max_i |r_i| / (|b(:,j)| + |A|*|x(:,j)|)_i */
00248 /* where r is the residual now stored in work[n+1..2n]. */
00249 /* The denominator is built in work[1..n]; entries not above safe2 are handled by adding safe1 */
00250 /* to both numerator and denominator before dividing. */
00251
00252
00253
00254 /* Seed the denominator with |b(:,j)| */
00255 i__2 = *n;
00256 for (i__ = 1; i__ <= i__2; ++i__) {
00257 work[i__] = (r__1 = b[i__ + j * b_dim1], dabs(r__1));
00258
00259 }
00260
00261
00262 /* Add |A|*|x(:,j)| using only the stored triangle: each off-diagonal entry a(i,k) contributes to row i and to row k */
00263 if (upper) {
00264 i__2 = *n;
00265 for (k = 1; k <= i__2; ++k) {
00266 s = 0.f;
00267 xk = (r__1 = x[k + j * x_dim1], dabs(r__1));
00268 i__3 = k - 1;
00269 for (i__ = 1; i__ <= i__3; ++i__) {
00270 work[i__] += (r__1 = a[i__ + k * a_dim1], dabs(r__1)) *
00271 xk;
00272 s += (r__1 = a[i__ + k * a_dim1], dabs(r__1)) * (r__2 = x[
00273 i__ + j * x_dim1], dabs(r__2));
00274
00275 }
00276 work[k] = work[k] + (r__1 = a[k + k * a_dim1], dabs(r__1)) *
00277 xk + s;
00278
00279 }
00280 } else {
00281 i__2 = *n;
00282 for (k = 1; k <= i__2; ++k) {
00283 s = 0.f;
00284 xk = (r__1 = x[k + j * x_dim1], dabs(r__1));
00285 work[k] += (r__1 = a[k + k * a_dim1], dabs(r__1)) * xk;
00286 i__3 = *n;
00287 for (i__ = k + 1; i__ <= i__3; ++i__) {
00288 work[i__] += (r__1 = a[i__ + k * a_dim1], dabs(r__1)) *
00289 xk;
00290 s += (r__1 = a[i__ + k * a_dim1], dabs(r__1)) * (r__2 = x[
00291 i__ + j * x_dim1], dabs(r__2));
00292
00293 }
00294 work[k] += s;
00295
00296 }
00297 }
00298 s = 0.f; /* running maximum that becomes berr[j] */
00299 i__2 = *n;
00300 for (i__ = 1; i__ <= i__2; ++i__) {
00301 if (work[i__] > safe2) {
00302 /* denominator above safe2: plain ratio |r_i| / work[i] */
00303 r__2 = s, r__3 = (r__1 = work[*n + i__], dabs(r__1)) / work[
00304 i__];
00305 s = dmax(r__2,r__3);
00306 } else {
00307 /* denominator not above safe2: add safe1 to numerator and denominator */
00308 r__2 = s, r__3 = ((r__1 = work[*n + i__], dabs(r__1)) + safe1)
00309 / (work[i__] + safe1);
00310 s = dmax(r__2,r__3);
00311 }
00312
00313 }
00314 berr[j] = s;
00315
00316
00317
00318 /* Refine again only when all three conditions hold: */
00319 /*   berr[j] is still above eps, */
00320 /*   berr[j] is at most half of the previous pass's value (lstres), */
00321 /*   and count <= 5. */
00322 if (berr[j] > eps && berr[j] * 2.f <= lstres && count <= 5) {
00323
00324 /* Solve in place for the correction held in work[n+1..2n] (one right-hand side, leading dimension n), */
00325 /* add it to x(:,j), remember this pass's berr and start the next pass */
00326 spotrs_(uplo, n, &c__1, &af[af_offset], ldaf, &work[*n + 1], n,
00327 info);
00328 saxpy_(n, &c_b14, &work[*n + 1], &c__1, &x[j * x_dim1 + 1], &c__1)
00329 ;
00330 lstres = berr[j];
00331 ++count;
00332 goto L20;
00333 }
00334
00335 /* Forward error estimate for column j. */
00336 /* First overwrite work[1..n] with the weights |r_i| + nz*eps*(|b| + |A|*|x|)_i, adding safe1 as well */
00337 /* when the old work[i] is not above safe2. */
00338 /* slacn2_ is then driven as a reverse-communication loop: while it returns kase != 0 the caller */
00339 /* transforms the vector in work[n+1..2n] as requested and calls it again (goto L100); the finished */
00340 /* estimate is left in ferr[j]. */
00341 /* NOTE(review): in LAPACK terms this presumably estimates the norm of inv(A) * diag(work[1..n]) - */
00342 /* confirm against the SPORFS and SLACN2 documentation. */
00343
00344
00345
00346
00347
00348
00349
00350
00351
00352
00353
00354
00355
00356
00357 i__2 = *n;
00358 for (i__ = 1; i__ <= i__2; ++i__) {
00359 if (work[i__] > safe2) {
00360 work[i__] = (r__1 = work[*n + i__], dabs(r__1)) + nz * eps *
00361 work[i__];
00362 } else {
00363 work[i__] = (r__1 = work[*n + i__], dabs(r__1)) + nz * eps *
00364 work[i__] + safe1;
00365 }
00366
00367 }
00368 /* kase = 0 is the value passed on the first slacn2_ call for this column; isave is handed back to slacn2_ on every call */
00369 kase = 0;
00370 L100:
00371 slacn2_(n, &work[(*n << 1) + 1], &work[*n + 1], &iwork[1], &ferr[j], &
00372 kase, isave);
00373 if (kase != 0) {
00374 if (kase == 1) {
00375
00376 /* kase == 1: apply spotrs_ to work[n+1..2n] first, then scale elementwise by the weights work[1..n] */
00377
00378 spotrs_(uplo, n, &c__1, &af[af_offset], ldaf, &work[*n + 1],
00379 n, info);
00380 i__2 = *n;
00381 for (i__ = 1; i__ <= i__2; ++i__) {
00382 work[*n + i__] = work[i__] * work[*n + i__];
00383
00384 }
00385 } else if (kase == 2) {
00386
00387 /* kase == 2: scale work[n+1..2n] elementwise by the weights work[1..n] first, then apply spotrs_ */
00388
00389 i__2 = *n;
00390 for (i__ = 1; i__ <= i__2; ++i__) {
00391 work[*n + i__] = work[i__] * work[*n + i__];
00392
00393 }
00394 spotrs_(uplo, n, &c__1, &af[af_offset], ldaf, &work[*n + 1],
00395 n, info);
00396 }
00397 goto L100;
00398 }
00399
00400 /* Normalize: divide ferr[j] by max_i |x(i,j)| (lstres is reused for that maximum) unless the maximum is zero */
00401
00402 lstres = 0.f;
00403 i__2 = *n;
00404 for (i__ = 1; i__ <= i__2; ++i__) {
00405
00406 r__2 = lstres, r__3 = (r__1 = x[i__ + j * x_dim1], dabs(r__1));
00407 lstres = dmax(r__2,r__3);
00408
00409 }
00410 if (lstres != 0.f) {
00411 ferr[j] /= lstres;
00412 }
00413
00414 /* end of the loop over right-hand side columns */
00415 }
00416
00417 return 0;
00418
00419 /* End of sporfs_ */
00420
00421 }