00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013 #include "f2c.h"
00014 #include "blaswrap.h"
00015
00016 /* Table of constant values.  They are file-scope objects rather than literals because slahr2_ passes them by address (&c_b4, &c__1, ...) to the extern routines it calls. */
00017
00018 static real c_b4 = -1.f; /* -1: scalar used where a product is subtracted (sgemv_/saxpy_ calls) */
00019 static real c_b5 = 1.f; /* +1: scalar used as a plain multiplier or to accumulate into the output */
00020 static integer c__1 = 1; /* 1: increment argument for vectors stored down a column */
00021 static real c_b38 = 0.f; /* 0: second scalar of sgemv_; presumably means "overwrite the output" (standard BLAS beta) - confirm */
00022
00023 int slahr2_(integer *n, integer *k, integer *nb, real *a,
00024 integer *lda, real *tau, real *t, integer *ldt, real *y, integer *ldy)
00025 {
00026 /* Generated-style locals: column strides/offsets for the 1-based indexing, plus scratch values passed by address */
00027 integer a_dim1, a_offset, t_dim1, t_offset, y_dim1, y_offset, i__1, i__2,
00028 i__3;
00029 real r__1;
00030
00031 /* i__ is the 1-based column counter; ei holds the element that is temporarily replaced by 1.f inside the loop */
00032 integer i__;
00033 real ei;
00034 extern int sscal_(integer *, real *, real *, integer *),
00035 sgemm_(char *, char *, integer *, integer *, integer *, real *,
00036 real *, integer *, real *, integer *, real *, real *, integer *), sgemv_(char *, integer *, integer *, real *,
00037 real *, integer *, real *, integer *, real *, real *, integer *), scopy_(integer *, real *, integer *, real *, integer *),
00038 strmm_(char *, char *, char *, char *, integer *, integer *, real
00039 *, real *, integer *, real *, integer *), saxpy_(integer *, real *, real *, integer *, real *,
00040 integer *), strmv_(char *, char *, char *, integer *, real *,
00041 integer *, real *, integer *), slarfg_(
00042 integer *, real *, real *, integer *, real *), slacpy_(char *,
00043 integer *, integer *, real *, integer *, real *, integer *);
00044
00045 /*  Overview */
00046 /*  ======== */
00047
00048 /*  Works on the first *nb columns of the column-major array a (column */
00049 /*  stride *lda), one column per loop iteration, using the 1-based */
00050 /*  indexing set up by the pointer adjustments below.  Iteration i: */
00051
00052 /*    1. (i > 1 only) updates A(K+1:N,i) from Y and the columns already */
00053 /*       processed, with the last column of T, T(1:i-1,NB), as scratch; */
00054 /*    2. calls slarfg_ on A(K+i:N,i), passing TAU(i) for its scalar; */
00055 /*    3. fills Y(K+1:N,i) and T(1:i,i). */
00056
00057 /*  After the loop it fills Y(1:K,1:NB) from A, the stored vectors and T. */
00058
00059 /*  NOTE(review): name and call sequence match the LAPACK auxiliary routine */
00060 /*  SLAHR2 (block step of a Hessenberg reduction, returning V, T and */
00061 /*  Y = A*V*T).  The original header text is absent from this listing, so */
00062 /*  confirm against the LAPACK reference before relying on that reading. */
00063 /*  The per-call notes further down assume the extern routines have the */
00064 /*  standard BLAS/LAPACK semantics; their definitions are not visible here. */
00065
00066 /*  Arguments (all passed by address) */
00067 /*  ================================= */
00068
00069 /*  n     (input)  Last row index used; the routine returns immediately */
00070 /*        when *n <= 1. */
00071
00072 /*  k     (input)  Row offset: the loop touches rows K+1..N, and rows 1..K */
00073 /*        of Y are filled only after the loop. */
00074
00075 /*  nb    (input)  Number of columns processed (loop trip count). */
00076 /*        NOTE(review): no check for *nb < 1; see the note after the loop. */
00077
00078 /*  a     (input/output)  Matrix storage, modified in place.  Columns up */
00079 /*        to N-K+1 are passed to sgemv_, so presumably at least that many */
00080 /*        columns must exist; verify against the caller. */
00081
00082 /*  lda   (input)  Column stride of a. */
00083
00084 /*  tau   (output)  TAU(i) is handed to slarfg_ and then read back to */
00085 /*        scale Y(:,i) and T(:,i); indices 1..NB are used. */
00086
00087 /*  t     (output)  Column i receives T(1:i-1,i) and the diagonal entry */
00088 /*        T(i,i) = TAU(i).  Entries below the diagonal are not written */
00089 /*        here. */
00090
00091 /*  ldt   (input)  Column stride of t. */
00092
00093 /*  y     (output)  Y(K+1:N,i) is written inside the loop, Y(1:K,1:NB) */
00094 /*        after it. */
00095
00096 /*  ldy   (input)  Column stride of y. */
00097
00098 /*  Returns 0 on every path. */
00099
00100
00101
00102
00103
00104
00105
00106
00107
00108
00109
00110
00111
00112
00113
00114
00115
00116
00117
00118
00119
00120
00121
00122
00123
00124
00125
00126
00127
00128
00129
00130
00131
00132
00133
00134
00135
00136
00137
00138
00139
00140
00141
00142
00143
00144
00145
00146
00147
00148
00149
00150
00151
00152
00153
00154
00155
00156
00157
00158
00159
00160
00161
00162
00163 /* Parameter adjustments: shift each pointer so that x[i] / x[row + col * x_dim1] can be used with 1-based indices */
00164 --tau;
00165 a_dim1 = *lda;
00166 a_offset = 1 + a_dim1;
00167 a -= a_offset;
00168 t_dim1 = *ldt;
00169 t_offset = 1 + t_dim1;
00170 t -= t_offset;
00171 y_dim1 = *ldy;
00172 y_offset = 1 + y_dim1;
00173 y -= y_offset;
00174
00175 /* Quick return: nothing is done when *n <= 1 */
00176 if (*n <= 1) {
00177 return 0;
00178 }
00179
00180 i__1 = *nb;
00181 for (i__ = 1; i__ <= i__1; ++i__) {
00182 if (i__ > 1) {
00183
00184 /* Update A(K+1:N,I) */
00185
00186 /* Update I-th column of A - Y * V': */
00187 /* A(K+1:N,I) -= Y(K+1:N,1:I-1) * A(K+I-1,1:I-1)' (row read with stride lda) */
00188 i__2 = *n - *k;
00189 i__3 = i__ - 1;
00190 sgemv_("NO TRANSPOSE", &i__2, &i__3, &c_b4, &y[*k + 1 + y_dim1],
00191 ldy, &a[*k + i__ - 1 + a_dim1], lda, &c_b5, &a[*k + 1 +
00192 i__ * a_dim1], &c__1);
00193
00194 /* Apply I - V * T' * V' to this column (call it b) from the */
00195 /* left, using the last column of T as workspace */
00196
00197 /* Let  V = ( V1 )   and   b = ( b1 )   (first I-1 rows) */
00198 /*          ( V2 )             ( b2 ) */
00199
00200 /* where V1 is unit lower triangular */
00201
00202 /* w := V1' * b1 */
00203
00204 i__2 = i__ - 1;
00205 scopy_(&i__2, &a[*k + 1 + i__ * a_dim1], &c__1, &t[*nb * t_dim1 +
00206 1], &c__1);
00207 i__2 = i__ - 1;
00208 strmv_("Lower", "Transpose", "UNIT", &i__2, &a[*k + 1 + a_dim1],
00209 lda, &t[*nb * t_dim1 + 1], &c__1);
00210
00211 /* w := w + V2'*b2 */
00212
00213 i__2 = *n - *k - i__ + 1;
00214 i__3 = i__ - 1;
00215 sgemv_("Transpose", &i__2, &i__3, &c_b5, &a[*k + i__ + a_dim1],
00216 lda, &a[*k + i__ + i__ * a_dim1], &c__1, &c_b5, &t[*nb *
00217 t_dim1 + 1], &c__1);
00218
00219 /* w := T'*w */
00220
00221 i__2 = i__ - 1;
00222 strmv_("Upper", "Transpose", "NON-UNIT", &i__2, &t[t_offset], ldt,
00223 &t[*nb * t_dim1 + 1], &c__1);
00224
00225 /* b2 := b2 - V2*w */
00226
00227 i__2 = *n - *k - i__ + 1;
00228 i__3 = i__ - 1;
00229 sgemv_("NO TRANSPOSE", &i__2, &i__3, &c_b4, &a[*k + i__ + a_dim1],
00230 lda, &t[*nb * t_dim1 + 1], &c__1, &c_b5, &a[*k + i__ +
00231 i__ * a_dim1], &c__1);
00232
00233 /* b1 := b1 - V1*w */
00234
00235 i__2 = i__ - 1;
00236 strmv_("Lower", "NO TRANSPOSE", "UNIT", &i__2, &a[*k + 1 + a_dim1]
00237 , lda, &t[*nb * t_dim1 + 1], &c__1);
00238 i__2 = i__ - 1;
00239 saxpy_(&i__2, &c_b4, &t[*nb * t_dim1 + 1], &c__1, &a[*k + 1 + i__
00240 * a_dim1], &c__1);
00241 /* Put back A(K+I-1,I-1): the previous iteration saved it in ei and overwrote it with 1.f */
00242 a[*k + i__ - 1 + (i__ - 1) * a_dim1] = ei;
00243 }
00244
00245 /* Call slarfg_ on the vector A(K+I:N,I); in LAPACK this generates the */
00246 /* elementary reflector H(I) that annihilates A(K+I+1:N,I) - confirm */
00247
00248 i__2 = *n - *k - i__ + 1;
00249 /* Computing MIN: keeps the second pointer on row N when K+I = N */
00250 i__3 = *k + i__ + 1;
00251 slarfg_(&i__2, &a[*k + i__ + i__ * a_dim1], &a[min(i__3, *n)+ i__ *
00252 a_dim1], &c__1, &tau[i__]);
00253 ei = a[*k + i__ + i__ * a_dim1];
00254 a[*k + i__ + i__ * a_dim1] = 1.f;
00255 /* Compute Y(K+1:N,I): A(K+1:N,I+1:N-K+1)*v, minus the part along the */
00256 /* earlier columns Y(K+1:N,1:I-1)*T(1:I-1,I), then scaled by TAU(I); */
00257 /* T(1:I-1,I) temporarily holds A(K+I:N,1:I-1)'*v, with v = A(K+I:N,I) */
00258 i__2 = *n - *k;
00259 i__3 = *n - *k - i__ + 1;
00260 sgemv_("NO TRANSPOSE", &i__2, &i__3, &c_b5, &a[*k + 1 + (i__ + 1) *
00261 a_dim1], lda, &a[*k + i__ + i__ * a_dim1], &c__1, &c_b38, &y[*
00262 k + 1 + i__ * y_dim1], &c__1);
00263 i__2 = *n - *k - i__ + 1;
00264 i__3 = i__ - 1;
00265 sgemv_("Transpose", &i__2, &i__3, &c_b5, &a[*k + i__ + a_dim1], lda, &
00266 a[*k + i__ + i__ * a_dim1], &c__1, &c_b38, &t[i__ * t_dim1 +
00267 1], &c__1);
00268 i__2 = *n - *k;
00269 i__3 = i__ - 1;
00270 sgemv_("NO TRANSPOSE", &i__2, &i__3, &c_b4, &y[*k + 1 + y_dim1], ldy,
00271 &t[i__ * t_dim1 + 1], &c__1, &c_b5, &y[*k + 1 + i__ * y_dim1],
00272 &c__1);
00273 i__2 = *n - *k;
00274 sscal_(&i__2, &tau[i__], &y[*k + 1 + i__ * y_dim1], &c__1);
00275 /* Compute T(1:I,I): scale T(1:I-1,I) by -TAU(I), multiply it by the */
00276 /* leading (I-1)x(I-1) upper triangle of T, then set T(I,I) = TAU(I) */
00277
00278 i__2 = i__ - 1;
00279 r__1 = -tau[i__];
00280 sscal_(&i__2, &r__1, &t[i__ * t_dim1 + 1], &c__1);
00281 i__2 = i__ - 1;
00282 strmv_("Upper", "No Transpose", "NON-UNIT", &i__2, &t[t_offset], ldt,
00283 &t[i__ * t_dim1 + 1], &c__1)
00284 ;
00285 t[i__ + i__ * t_dim1] = tau[i__];
00286
00287
00288 }
00289 a[*k + *nb + *nb * a_dim1] = ei; /* put back A(K+NB,NB) saved by the last iteration */
00290 /* NOTE(review): if *nb < 1 the loop never runs, so ei is read unset above. */
00291 /* Compute Y(1:K,1:NB): copy A(1:K,2:NB+1), multiply by the unit lower triangle of A(K+1:K+NB,1:NB), */
00292 /* add A(1:K,NB+2:N-K+1)*A(K+NB+1:N,1:NB) when N > K+NB, then multiply by the upper triangle of T */
00293 slacpy_("ALL", k, nb, &a[(a_dim1 << 1) + 1], lda, &y[y_offset], ldy);
00294 strmm_("RIGHT", "Lower", "NO TRANSPOSE", "UNIT", k, nb, &c_b5, &a[*k + 1
00295 + a_dim1], lda, &y[y_offset], ldy);
00296 if (*n > *k + *nb) {
00297 i__1 = *n - *k - *nb;
00298 sgemm_("NO TRANSPOSE", "NO TRANSPOSE", k, nb, &i__1, &c_b5, &a[(*nb +
00299 2) * a_dim1 + 1], lda, &a[*k + 1 + *nb + a_dim1], lda, &c_b5,
00300 &y[y_offset], ldy);
00301 }
00302 strmm_("RIGHT", "Upper", "NO TRANSPOSE", "NON-UNIT", k, nb, &c_b5, &t[
00303 t_offset], ldt, &y[y_offset], ldy);
00304
00305 return 0;
00306
00307 /* End of slahr2_ */
00308
00309 }