/root/doris/contrib/openblas/lapack-netlib/SRC/dlasq2.c
Line | Count | Source |
1 | | #include <math.h> |
2 | | #include <stdlib.h> |
3 | | #include <string.h> |
4 | | #include <stdio.h> |
5 | | #include <complex.h> |
6 | | #ifdef complex |
7 | | #undef complex |
8 | | #endif |
9 | | #ifdef I |
10 | | #undef I |
11 | | #endif |
12 | | |
13 | | #if defined(_WIN64) |
14 | | typedef long long BLASLONG; |
15 | | typedef unsigned long long BLASULONG; |
16 | | #else |
17 | | typedef long BLASLONG; |
18 | | typedef unsigned long BLASULONG; |
19 | | #endif |
20 | | |
21 | | #ifdef LAPACK_ILP64 |
22 | | typedef BLASLONG blasint; |
23 | | #if defined(_WIN64) |
24 | | #define blasabs(x) llabs(x) |
25 | | #else |
26 | | #define blasabs(x) labs(x) |
27 | | #endif |
28 | | #else |
29 | | typedef int blasint; |
30 | | #define blasabs(x) abs(x) |
31 | | #endif |
32 | | |
33 | | typedef blasint integer; |
34 | | |
35 | | typedef unsigned int uinteger; |
36 | | typedef char *address; |
37 | | typedef short int shortint; |
38 | | typedef float real; |
39 | | typedef double doublereal; |
40 | | typedef struct { real r, i; } complex; |
41 | | typedef struct { doublereal r, i; } doublecomplex; |
42 | | #ifdef _MSC_VER |
43 | | static inline _Fcomplex Cf(complex *z) {_Fcomplex zz={z->r , z->i}; return zz;} |
44 | | static inline _Dcomplex Cd(doublecomplex *z) {_Dcomplex zz={z->r , z->i};return zz;} |
45 | | static inline _Fcomplex * _pCf(complex *z) {return (_Fcomplex*)z;} |
46 | | static inline _Dcomplex * _pCd(doublecomplex *z) {return (_Dcomplex*)z;} |
47 | | #else |
48 | 0 | static inline _Complex float Cf(complex *z) {return z->r + z->i*_Complex_I;} |
49 | 0 | static inline _Complex double Cd(doublecomplex *z) {return z->r + z->i*_Complex_I;} |
50 | 0 | static inline _Complex float * _pCf(complex *z) {return (_Complex float*)z;} |
51 | 0 | static inline _Complex double * _pCd(doublecomplex *z) {return (_Complex double*)z;} |
52 | | #endif |
53 | | #define pCf(z) (*_pCf(z)) |
54 | | #define pCd(z) (*_pCd(z)) |
55 | | typedef blasint logical; |
56 | | |
57 | | typedef char logical1; |
58 | | typedef char integer1; |
59 | | |
60 | | #define TRUE_ (1) |
61 | | #define FALSE_ (0) |
62 | | |
63 | | /* Extern is for use with -E */ |
64 | | #ifndef Extern |
65 | | #define Extern extern |
66 | | #endif |
67 | | |
68 | | /* I/O stuff */ |
69 | | |
70 | | typedef int flag; |
71 | | typedef int ftnlen; |
72 | | typedef int ftnint; |
73 | | |
74 | | /*external read, write*/ |
75 | | typedef struct |
76 | | { flag cierr; |
77 | | ftnint ciunit; |
78 | | flag ciend; |
79 | | char *cifmt; |
80 | | ftnint cirec; |
81 | | } cilist; |
82 | | |
83 | | /*internal read, write*/ |
84 | | typedef struct |
85 | | { flag icierr; |
86 | | char *iciunit; |
87 | | flag iciend; |
88 | | char *icifmt; |
89 | | ftnint icirlen; |
90 | | ftnint icirnum; |
91 | | } icilist; |
92 | | |
93 | | /*open*/ |
94 | | typedef struct |
95 | | { flag oerr; |
96 | | ftnint ounit; |
97 | | char *ofnm; |
98 | | ftnlen ofnmlen; |
99 | | char *osta; |
100 | | char *oacc; |
101 | | char *ofm; |
102 | | ftnint orl; |
103 | | char *oblnk; |
104 | | } olist; |
105 | | |
106 | | /*close*/ |
107 | | typedef struct |
108 | | { flag cerr; |
109 | | ftnint cunit; |
110 | | char *csta; |
111 | | } cllist; |
112 | | |
113 | | /*rewind, backspace, endfile*/ |
114 | | typedef struct |
115 | | { flag aerr; |
116 | | ftnint aunit; |
117 | | } alist; |
118 | | |
119 | | /* inquire */ |
120 | | typedef struct |
121 | | { flag inerr; |
122 | | ftnint inunit; |
123 | | char *infile; |
124 | | ftnlen infilen; |
125 | | ftnint *inex; /*parameters in standard's order*/ |
126 | | ftnint *inopen; |
127 | | ftnint *innum; |
128 | | ftnint *innamed; |
129 | | char *inname; |
130 | | ftnlen innamlen; |
131 | | char *inacc; |
132 | | ftnlen inacclen; |
133 | | char *inseq; |
134 | | ftnlen inseqlen; |
135 | | char *indir; |
136 | | ftnlen indirlen; |
137 | | char *infmt; |
138 | | ftnlen infmtlen; |
139 | | char *inform; |
140 | | ftnint informlen; |
141 | | char *inunf; |
142 | | ftnlen inunflen; |
143 | | ftnint *inrecl; |
144 | | ftnint *innrec; |
145 | | char *inblank; |
146 | | ftnlen inblanklen; |
147 | | } inlist; |
148 | | |
149 | | #define VOID void |
150 | | |
151 | | union Multitype { /* for multiple entry points */ |
152 | | integer1 g; |
153 | | shortint h; |
154 | | integer i; |
155 | | /* longint j; */ |
156 | | real r; |
157 | | doublereal d; |
158 | | complex c; |
159 | | doublecomplex z; |
160 | | }; |
161 | | |
162 | | typedef union Multitype Multitype; |
163 | | |
164 | | struct Vardesc { /* for Namelist */ |
165 | | char *name; |
166 | | char *addr; |
167 | | ftnlen *dims; |
168 | | int type; |
169 | | }; |
170 | | typedef struct Vardesc Vardesc; |
171 | | |
172 | | struct Namelist { |
173 | | char *name; |
174 | | Vardesc **vars; |
175 | | int nvars; |
176 | | }; |
177 | | typedef struct Namelist Namelist; |
178 | | |
179 | 0 | #define abs(x) ((x) >= 0 ? (x) : -(x)) |
180 | | #define dabs(x) (fabs(x)) |
181 | 0 | #define f2cmin(a,b) ((a) <= (b) ? (a) : (b)) |
182 | 0 | #define f2cmax(a,b) ((a) >= (b) ? (a) : (b)) |
183 | | #define dmin(a,b) (f2cmin(a,b)) |
184 | | #define dmax(a,b) (f2cmax(a,b)) |
185 | | #define bit_test(a,b) ((a) >> (b) & 1) |
186 | | #define bit_clear(a,b) ((a) & ~((uinteger)1 << (b))) |
187 | | #define bit_set(a,b) ((a) | ((uinteger)1 << (b))) |
188 | | |
189 | | #define abort_() { sig_die("Fortran abort routine called", 1); } |
190 | | #define c_abs(z) (cabsf(Cf(z))) |
191 | | #define c_cos(R,Z) { pCf(R)=ccos(Cf(Z)); } |
192 | | #ifdef _MSC_VER |
193 | | #define c_div(c, a, b) {Cf(c)._Val[0] = (Cf(a)._Val[0]/Cf(b)._Val[0]); Cf(c)._Val[1]=(Cf(a)._Val[1]/Cf(b)._Val[1]);} |
194 | | #define z_div(c, a, b) {Cd(c)._Val[0] = (Cd(a)._Val[0]/Cd(b)._Val[0]); Cd(c)._Val[1]=(Cd(a)._Val[1]/df(b)._Val[1]);} |
195 | | #else |
196 | | #define c_div(c, a, b) {pCf(c) = Cf(a)/Cf(b);} |
197 | | #define z_div(c, a, b) {pCd(c) = Cd(a)/Cd(b);} |
198 | | #endif |
199 | | #define c_exp(R, Z) {pCf(R) = cexpf(Cf(Z));} |
200 | | #define c_log(R, Z) {pCf(R) = clogf(Cf(Z));} |
201 | | #define c_sin(R, Z) {pCf(R) = csinf(Cf(Z));} |
202 | | //#define c_sqrt(R, Z) {*(R) = csqrtf(Cf(Z));} |
203 | | #define c_sqrt(R, Z) {pCf(R) = csqrtf(Cf(Z));} |
204 | | #define d_abs(x) (fabs(*(x))) |
205 | | #define d_acos(x) (acos(*(x))) |
206 | | #define d_asin(x) (asin(*(x))) |
207 | | #define d_atan(x) (atan(*(x))) |
208 | | #define d_atn2(x, y) (atan2(*(x),*(y))) |
209 | | #define d_cnjg(R, Z) { pCd(R) = conj(Cd(Z)); } |
210 | | #define r_cnjg(R, Z) { pCf(R) = conjf(Cf(Z)); } |
211 | | #define d_cos(x) (cos(*(x))) |
212 | | #define d_cosh(x) (cosh(*(x))) |
213 | | #define d_dim(__a, __b) ( *(__a) > *(__b) ? *(__a) - *(__b) : 0.0 ) |
214 | | #define d_exp(x) (exp(*(x))) |
215 | | #define d_imag(z) (cimag(Cd(z))) |
216 | | #define r_imag(z) (cimagf(Cf(z))) |
217 | | #define d_int(__x) (*(__x)>0 ? floor(*(__x)) : -floor(- *(__x))) |
218 | | #define r_int(__x) (*(__x)>0 ? floor(*(__x)) : -floor(- *(__x))) |
219 | | #define d_lg10(x) ( 0.43429448190325182765 * log(*(x)) ) |
220 | | #define r_lg10(x) ( 0.43429448190325182765 * log(*(x)) ) |
221 | | #define d_log(x) (log(*(x))) |
222 | | #define d_mod(x, y) (fmod(*(x), *(y))) |
223 | | #define u_nint(__x) ((__x)>=0 ? floor((__x) + .5) : -floor(.5 - (__x))) |
224 | | #define d_nint(x) u_nint(*(x)) |
225 | | #define u_sign(__a,__b) ((__b) >= 0 ? ((__a) >= 0 ? (__a) : -(__a)) : -((__a) >= 0 ? (__a) : -(__a))) |
226 | | #define d_sign(a,b) u_sign(*(a),*(b)) |
227 | | #define r_sign(a,b) u_sign(*(a),*(b)) |
228 | | #define d_sin(x) (sin(*(x))) |
229 | | #define d_sinh(x) (sinh(*(x))) |
230 | | #define d_sqrt(x) (sqrt(*(x))) |
231 | | #define d_tan(x) (tan(*(x))) |
232 | | #define d_tanh(x) (tanh(*(x))) |
233 | | #define i_abs(x) abs(*(x)) |
234 | | #define i_dnnt(x) ((integer)u_nint(*(x))) |
235 | | #define i_len(s, n) (n) |
236 | | #define i_nint(x) ((integer)u_nint(*(x))) |
237 | | #define i_sign(a,b) ((integer)u_sign((integer)*(a),(integer)*(b))) |
238 | | #define pow_dd(ap, bp) ( pow(*(ap), *(bp))) |
239 | | #define pow_si(B,E) spow_ui(*(B),*(E)) |
240 | | #define pow_ri(B,E) spow_ui(*(B),*(E)) |
241 | | #define pow_di(B,E) dpow_ui(*(B),*(E)) |
242 | | #define pow_zi(p, a, b) {pCd(p) = zpow_ui(Cd(a), *(b));} |
243 | | #define pow_ci(p, a, b) {pCf(p) = cpow_ui(Cf(a), *(b));} |
244 | | #define pow_zz(R,A,B) {pCd(R) = cpow(Cd(A),*(B));} |
245 | | #define s_cat(lpp, rpp, rnp, np, llp) { ftnlen i, nc, ll; char *f__rp, *lp; ll = (llp); lp = (lpp); for(i=0; i < (int)*(np); ++i) { nc = ll; if((rnp)[i] < nc) nc = (rnp)[i]; ll -= nc; f__rp = (rpp)[i]; while(--nc >= 0) *lp++ = *(f__rp)++; } while(--ll >= 0) *lp++ = ' '; } |
246 | | #define s_cmp(a,b,c,d) ((integer)strncmp((a),(b),f2cmin((c),(d)))) |
247 | | #define s_copy(A,B,C,D) { int __i,__m; for (__i=0, __m=f2cmin((C),(D)); __i<__m && (B)[__i] != 0; ++__i) (A)[__i] = (B)[__i]; } |
248 | | #define sig_die(s, kill) { exit(1); } |
249 | | #define s_stop(s, n) {exit(0);} |
250 | | static char junk[] = "\n@(#)LIBF77 VERSION 19990503\n"; |
251 | | #define z_abs(z) (cabs(Cd(z))) |
252 | | #define z_exp(R, Z) {pCd(R) = cexp(Cd(Z));} |
253 | | #define z_sqrt(R, Z) {pCd(R) = csqrt(Cd(Z));} |
254 | | #define myexit_() break; |
255 | | #define mycycle() continue; |
256 | | #define myceiling(w) {ceil(w)} |
257 | | #define myhuge(w) {HUGE_VAL} |
258 | | //#define mymaxloc_(w,s,e,n) {if (sizeof(*(w)) == sizeof(double)) dmaxloc_((w),*(s),*(e),n); else dmaxloc_((w),*(s),*(e),n);} |
259 | | #define mymaxloc(w,s,e,n) {dmaxloc_(w,*(s),*(e),n)} |
260 | | |
261 | | /* procedure parameter types for -A and -C++ */ |
262 | | |
263 | | |
264 | | #ifdef __cplusplus |
265 | | typedef logical (*L_fp)(...); |
266 | | #else |
267 | | typedef logical (*L_fp)(); |
268 | | #endif |
269 | | |
270 | 0 | static float spow_ui(float x, integer n) { |
271 | 0 | float pow=1.0; unsigned long int u; |
272 | 0 | if(n != 0) { |
273 | 0 | if(n < 0) n = -n, x = 1/x; |
274 | 0 | for(u = n; ; ) { |
275 | 0 | if(u & 01) pow *= x; |
276 | 0 | if(u >>= 1) x *= x; |
277 | 0 | else break; |
278 | 0 | } |
279 | 0 | } |
280 | 0 | return pow; |
281 | 0 | } |
282 | 0 | static double dpow_ui(double x, integer n) { |
283 | 0 | double pow=1.0; unsigned long int u; |
284 | 0 | if(n != 0) { |
285 | 0 | if(n < 0) n = -n, x = 1/x; |
286 | 0 | for(u = n; ; ) { |
287 | 0 | if(u & 01) pow *= x; |
288 | 0 | if(u >>= 1) x *= x; |
289 | 0 | else break; |
290 | 0 | } |
291 | 0 | } |
292 | 0 | return pow; |
293 | 0 | } |
294 | | #ifdef _MSC_VER |
295 | | static _Fcomplex cpow_ui(complex x, integer n) { |
296 | | complex pow={1.0,0.0}; unsigned long int u; |
297 | | if(n != 0) { |
298 | | if(n < 0) n = -n, x.r = 1/x.r, x.i=1/x.i; |
299 | | for(u = n; ; ) { |
300 | | if(u & 01) pow.r *= x.r, pow.i *= x.i; |
301 | | if(u >>= 1) x.r *= x.r, x.i *= x.i; |
302 | | else break; |
303 | | } |
304 | | } |
305 | | _Fcomplex p={pow.r, pow.i}; |
306 | | return p; |
307 | | } |
308 | | #else |
309 | 0 | static _Complex float cpow_ui(_Complex float x, integer n) { |
310 | 0 | _Complex float pow=1.0; unsigned long int u; |
311 | 0 | if(n != 0) { |
312 | 0 | if(n < 0) n = -n, x = 1/x; |
313 | 0 | for(u = n; ; ) { |
314 | 0 | if(u & 01) pow *= x; |
315 | 0 | if(u >>= 1) x *= x; |
316 | 0 | else break; |
317 | 0 | } |
318 | 0 | } |
319 | 0 | return pow; |
320 | 0 | } |
321 | | #endif |
322 | | #ifdef _MSC_VER |
323 | | static _Dcomplex zpow_ui(_Dcomplex x, integer n) { |
324 | | _Dcomplex pow={1.0,0.0}; unsigned long int u; |
325 | | if(n != 0) { |
326 | | if(n < 0) n = -n, x._Val[0] = 1/x._Val[0], x._Val[1] =1/x._Val[1]; |
327 | | for(u = n; ; ) { |
328 | | if(u & 01) pow._Val[0] *= x._Val[0], pow._Val[1] *= x._Val[1]; |
329 | | if(u >>= 1) x._Val[0] *= x._Val[0], x._Val[1] *= x._Val[1]; |
330 | | else break; |
331 | | } |
332 | | } |
333 | | _Dcomplex p = {pow._Val[0], pow._Val[1]}; |
334 | | return p; |
335 | | } |
336 | | #else |
337 | 0 | static _Complex double zpow_ui(_Complex double x, integer n) { |
338 | 0 | _Complex double pow=1.0; unsigned long int u; |
339 | 0 | if(n != 0) { |
340 | 0 | if(n < 0) n = -n, x = 1/x; |
341 | 0 | for(u = n; ; ) { |
342 | 0 | if(u & 01) pow *= x; |
343 | 0 | if(u >>= 1) x *= x; |
344 | 0 | else break; |
345 | 0 | } |
346 | 0 | } |
347 | 0 | return pow; |
348 | 0 | } |
349 | | #endif |
350 | 0 | static integer pow_ii(integer x, integer n) { |
351 | 0 | integer pow; unsigned long int u; |
352 | 0 | if (n <= 0) { |
353 | 0 | if (n == 0 || x == 1) pow = 1; |
354 | 0 | else if (x != -1) pow = x == 0 ? 1/x : 0; |
355 | 0 | else n = -n; |
356 | 0 | } |
357 | 0 | if ((n > 0) || !(n == 0 || x == 1 || x != -1)) { |
358 | 0 | u = n; |
359 | 0 | for(pow = 1; ; ) { |
360 | 0 | if(u & 01) pow *= x; |
361 | 0 | if(u >>= 1) x *= x; |
362 | 0 | else break; |
363 | 0 | } |
364 | 0 | } |
365 | 0 | return pow; |
366 | 0 | } |
367 | | static integer dmaxloc_(double *w, integer s, integer e, integer *n) |
368 | 0 | { |
369 | 0 | double m; integer i, mi; |
370 | 0 | for(m=w[s-1], mi=s, i=s+1; i<=e; i++) |
371 | 0 | if (w[i-1]>m) mi=i ,m=w[i-1]; |
372 | 0 | return mi-s+1; |
373 | 0 | } |
374 | | static integer smaxloc_(float *w, integer s, integer e, integer *n) |
375 | 0 | { |
376 | 0 | float m; integer i, mi; |
377 | 0 | for(m=w[s-1], mi=s, i=s+1; i<=e; i++) |
378 | 0 | if (w[i-1]>m) mi=i ,m=w[i-1]; |
379 | 0 | return mi-s+1; |
380 | 0 | } |
381 | 0 | static inline void cdotc_(complex *z, integer *n_, complex *x, integer *incx_, complex *y, integer *incy_) { |
382 | 0 | integer n = *n_, incx = *incx_, incy = *incy_, i; |
383 | 0 | #ifdef _MSC_VER |
384 | 0 | _Fcomplex zdotc = {0.0, 0.0}; |
385 | 0 | if (incx == 1 && incy == 1) { |
386 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
387 | 0 | zdotc._Val[0] += conjf(Cf(&x[i]))._Val[0] * Cf(&y[i])._Val[0]; |
388 | 0 | zdotc._Val[1] += conjf(Cf(&x[i]))._Val[1] * Cf(&y[i])._Val[1]; |
389 | 0 | } |
390 | 0 | } else { |
391 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
392 | 0 | zdotc._Val[0] += conjf(Cf(&x[i*incx]))._Val[0] * Cf(&y[i*incy])._Val[0]; |
393 | 0 | zdotc._Val[1] += conjf(Cf(&x[i*incx]))._Val[1] * Cf(&y[i*incy])._Val[1]; |
394 | 0 | } |
395 | 0 | } |
396 | 0 | pCf(z) = zdotc; |
397 | 0 | } |
398 | 0 | #else |
399 | 0 | _Complex float zdotc = 0.0; |
400 | 0 | if (incx == 1 && incy == 1) { |
401 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
402 | 0 | zdotc += conjf(Cf(&x[i])) * Cf(&y[i]); |
403 | 0 | } |
404 | 0 | } else { |
405 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
406 | 0 | zdotc += conjf(Cf(&x[i*incx])) * Cf(&y[i*incy]); |
407 | 0 | } |
408 | 0 | } |
409 | 0 | pCf(z) = zdotc; |
410 | 0 | } |
411 | | #endif |
412 | 0 | static inline void zdotc_(doublecomplex *z, integer *n_, doublecomplex *x, integer *incx_, doublecomplex *y, integer *incy_) { |
413 | 0 | integer n = *n_, incx = *incx_, incy = *incy_, i; |
414 | 0 | #ifdef _MSC_VER |
415 | 0 | _Dcomplex zdotc = {0.0, 0.0}; |
416 | 0 | if (incx == 1 && incy == 1) { |
417 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
418 | 0 | zdotc._Val[0] += conj(Cd(&x[i]))._Val[0] * Cd(&y[i])._Val[0]; |
419 | 0 | zdotc._Val[1] += conj(Cd(&x[i]))._Val[1] * Cd(&y[i])._Val[1]; |
420 | 0 | } |
421 | 0 | } else { |
422 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
423 | 0 | zdotc._Val[0] += conj(Cd(&x[i*incx]))._Val[0] * Cd(&y[i*incy])._Val[0]; |
424 | 0 | zdotc._Val[1] += conj(Cd(&x[i*incx]))._Val[1] * Cd(&y[i*incy])._Val[1]; |
425 | 0 | } |
426 | 0 | } |
427 | 0 | pCd(z) = zdotc; |
428 | 0 | } |
429 | 0 | #else |
430 | 0 | _Complex double zdotc = 0.0; |
431 | 0 | if (incx == 1 && incy == 1) { |
432 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
433 | 0 | zdotc += conj(Cd(&x[i])) * Cd(&y[i]); |
434 | 0 | } |
435 | 0 | } else { |
436 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
437 | 0 | zdotc += conj(Cd(&x[i*incx])) * Cd(&y[i*incy]); |
438 | 0 | } |
439 | 0 | } |
440 | 0 | pCd(z) = zdotc; |
441 | 0 | } |
442 | | #endif |
443 | 0 | static inline void cdotu_(complex *z, integer *n_, complex *x, integer *incx_, complex *y, integer *incy_) { |
444 | 0 | integer n = *n_, incx = *incx_, incy = *incy_, i; |
445 | 0 | #ifdef _MSC_VER |
446 | 0 | _Fcomplex zdotc = {0.0, 0.0}; |
447 | 0 | if (incx == 1 && incy == 1) { |
448 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
449 | 0 | zdotc._Val[0] += Cf(&x[i])._Val[0] * Cf(&y[i])._Val[0]; |
450 | 0 | zdotc._Val[1] += Cf(&x[i])._Val[1] * Cf(&y[i])._Val[1]; |
451 | 0 | } |
452 | 0 | } else { |
453 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
454 | 0 | zdotc._Val[0] += Cf(&x[i*incx])._Val[0] * Cf(&y[i*incy])._Val[0]; |
455 | 0 | zdotc._Val[1] += Cf(&x[i*incx])._Val[1] * Cf(&y[i*incy])._Val[1]; |
456 | 0 | } |
457 | 0 | } |
458 | 0 | pCf(z) = zdotc; |
459 | 0 | } |
460 | 0 | #else |
461 | 0 | _Complex float zdotc = 0.0; |
462 | 0 | if (incx == 1 && incy == 1) { |
463 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
464 | 0 | zdotc += Cf(&x[i]) * Cf(&y[i]); |
465 | 0 | } |
466 | 0 | } else { |
467 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
468 | 0 | zdotc += Cf(&x[i*incx]) * Cf(&y[i*incy]); |
469 | 0 | } |
470 | 0 | } |
471 | 0 | pCf(z) = zdotc; |
472 | 0 | } |
473 | | #endif |
474 | 0 | static inline void zdotu_(doublecomplex *z, integer *n_, doublecomplex *x, integer *incx_, doublecomplex *y, integer *incy_) { |
475 | 0 | integer n = *n_, incx = *incx_, incy = *incy_, i; |
476 | 0 | #ifdef _MSC_VER |
477 | 0 | _Dcomplex zdotc = {0.0, 0.0}; |
478 | 0 | if (incx == 1 && incy == 1) { |
479 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
480 | 0 | zdotc._Val[0] += Cd(&x[i])._Val[0] * Cd(&y[i])._Val[0]; |
481 | 0 | zdotc._Val[1] += Cd(&x[i])._Val[1] * Cd(&y[i])._Val[1]; |
482 | 0 | } |
483 | 0 | } else { |
484 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
485 | 0 | zdotc._Val[0] += Cd(&x[i*incx])._Val[0] * Cd(&y[i*incy])._Val[0]; |
486 | 0 | zdotc._Val[1] += Cd(&x[i*incx])._Val[1] * Cd(&y[i*incy])._Val[1]; |
487 | 0 | } |
488 | 0 | } |
489 | 0 | pCd(z) = zdotc; |
490 | 0 | } |
491 | 0 | #else |
492 | 0 | _Complex double zdotc = 0.0; |
493 | 0 | if (incx == 1 && incy == 1) { |
494 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
495 | 0 | zdotc += Cd(&x[i]) * Cd(&y[i]); |
496 | 0 | } |
497 | 0 | } else { |
498 | 0 | for (i=0;i<n;i++) { /* zdotc = zdotc + dconjg(x(i))* y(i) */ |
499 | 0 | zdotc += Cd(&x[i*incx]) * Cd(&y[i*incy]); |
500 | 0 | } |
501 | 0 | } |
502 | 0 | pCd(z) = zdotc; |
503 | 0 | } |
504 | | #endif |
505 | | /* -- translated by f2c (version 20000121). |
506 | | You must link the resulting object file with the libraries: |
507 | | -lf2c -lm (in that order) |
508 | | */ |
509 | | |
510 | | |
511 | | |
512 | | |
513 | | /* Table of constant values */ |
514 | | |
515 | | static integer c__1 = 1; |
516 | | static integer c__2 = 2; |
517 | | static integer c__10 = 10; |
518 | | static integer c__3 = 3; |
519 | | static integer c__4 = 4; |
520 | | static integer c__11 = 11; |
521 | | |
522 | | /* > \brief \b DLASQ2 computes all the eigenvalues of the symmetric positive definite tridiagonal matrix assoc |
523 | | iated with the qd Array Z to high relative accuracy. Used by sbdsqr and sstegr. */ |
524 | | |
525 | | /* =========== DOCUMENTATION =========== */ |
526 | | |
527 | | /* Online html documentation available at */ |
528 | | /* http://www.netlib.org/lapack/explore-html/ */ |
529 | | |
530 | | /* > \htmlonly */ |
531 | | /* > Download DLASQ2 + dependencies */ |
532 | | /* > <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/dlasq2. |
533 | | f"> */ |
534 | | /* > [TGZ]</a> */ |
535 | | /* > <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/dlasq2. |
536 | | f"> */ |
537 | | /* > [ZIP]</a> */ |
538 | | /* > <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/dlasq2. |
539 | | f"> */ |
540 | | /* > [TXT]</a> */ |
541 | | /* > \endhtmlonly */ |
542 | | |
543 | | /* Definition: */ |
544 | | /* =========== */ |
545 | | |
546 | | /* SUBROUTINE DLASQ2( N, Z, INFO ) */ |
547 | | |
548 | | /* INTEGER INFO, N */ |
549 | | /* DOUBLE PRECISION Z( * ) */ |
550 | | |
551 | | |
552 | | /* > \par Purpose: */ |
553 | | /* ============= */ |
554 | | /* > */ |
555 | | /* > \verbatim */ |
556 | | /* > */ |
557 | | /* > DLASQ2 computes all the eigenvalues of the symmetric positive */ |
558 | | /* > definite tridiagonal matrix associated with the qd array Z to high */ |
559 | | /* > relative accuracy are computed to high relative accuracy, in the */ |
560 | | /* > absence of denormalization, underflow and overflow. */ |
561 | | /* > */ |
562 | | /* > To see the relation of Z to the tridiagonal matrix, let L be a */ |
563 | | /* > unit lower bidiagonal matrix with subdiagonals Z(2,4,6,,..) and */ |
564 | | /* > let U be an upper bidiagonal matrix with 1's above and diagonal */ |
565 | | /* > Z(1,3,5,,..). The tridiagonal is L*U or, if you prefer, the */ |
566 | | /* > symmetric tridiagonal to which it is similar. */ |
567 | | /* > */ |
568 | | /* > Note : DLASQ2 defines a logical variable, IEEE, which is true */ |
569 | | /* > on machines which follow ieee-754 floating-point standard in their */ |
570 | | /* > handling of infinities and NaNs, and false otherwise. This variable */ |
571 | | /* > is passed to DLASQ3. */ |
572 | | /* > \endverbatim */ |
573 | | |
574 | | /* Arguments: */ |
575 | | /* ========== */ |
576 | | |
577 | | /* > \param[in] N */ |
578 | | /* > \verbatim */ |
579 | | /* > N is INTEGER */ |
580 | | /* > The number of rows and columns in the matrix. N >= 0. */ |
581 | | /* > \endverbatim */ |
582 | | /* > */ |
583 | | /* > \param[in,out] Z */ |
584 | | /* > \verbatim */ |
585 | | /* > Z is DOUBLE PRECISION array, dimension ( 4*N ) */ |
586 | | /* > On entry Z holds the qd array. On exit, entries 1 to N hold */ |
587 | | /* > the eigenvalues in decreasing order, Z( 2*N+1 ) holds the */ |
588 | | /* > trace, and Z( 2*N+2 ) holds the sum of the eigenvalues. If */ |
589 | | /* > N > 2, then Z( 2*N+3 ) holds the iteration count, Z( 2*N+4 ) */ |
590 | | /* > holds NDIVS/NIN^2, and Z( 2*N+5 ) holds the percentage of */ |
591 | | /* > shifts that failed. */ |
592 | | /* > \endverbatim */ |
593 | | /* > */ |
594 | | /* > \param[out] INFO */ |
595 | | /* > \verbatim */ |
596 | | /* > INFO is INTEGER */ |
597 | | /* > = 0: successful exit */ |
598 | | /* > < 0: if the i-th argument is a scalar and had an illegal */ |
599 | | /* > value, then INFO = -i, if the i-th argument is an */ |
600 | | /* > array and the j-entry had an illegal value, then */ |
601 | | /* > INFO = -(i*100+j) */ |
602 | | /* > > 0: the algorithm failed */ |
603 | | /* > = 1, a split was marked by a positive value in E */ |
604 | | /* > = 2, current block of Z not diagonalized after 100*N */ |
605 | | /* > iterations (in inner while loop). On exit Z holds */ |
606 | | /* > a qd array with the same eigenvalues as the given Z. */ |
607 | | /* > = 3, termination criterion of outer while loop not met */ |
608 | | /* > (program created more than N unreduced blocks) */ |
609 | | /* > \endverbatim */ |
610 | | |
611 | | /* Authors: */ |
612 | | /* ======== */ |
613 | | |
614 | | /* > \author Univ. of Tennessee */ |
615 | | /* > \author Univ. of California Berkeley */ |
616 | | /* > \author Univ. of Colorado Denver */ |
617 | | /* > \author NAG Ltd. */ |
618 | | |
619 | | /* > \date December 2016 */ |
620 | | |
621 | | /* > \ingroup auxOTHERcomputational */ |
622 | | |
623 | | /* > \par Further Details: */ |
624 | | /* ===================== */ |
625 | | /* > */ |
626 | | /* > \verbatim */ |
627 | | /* > */ |
628 | | /* > Local Variables: I0:N0 defines a current unreduced segment of Z. */ |
629 | | /* > The shifts are accumulated in SIGMA. Iteration count is in ITER. */ |
630 | | /* > Ping-pong is controlled by PP (alternates between 0 and 1). */ |
631 | | /* > \endverbatim */ |
632 | | /* > */ |
633 | | /* ===================================================================== */ |
634 | | /* Subroutine */ void dlasq2_(integer *n, doublereal *z__, integer *info) |
635 | 0 | { |
636 | | /* System generated locals */ |
637 | 0 | integer i__1, i__2, i__3; |
638 | 0 | doublereal d__1, d__2; |
639 | | |
640 | | /* Local variables */ |
641 | 0 | logical ieee; |
642 | 0 | integer nbig; |
643 | 0 | doublereal dmin__, emin, emax; |
644 | 0 | integer kmin, ndiv, iter; |
645 | 0 | doublereal qmin, temp, qmax, zmax; |
646 | 0 | integer splt; |
647 | 0 | doublereal dmin1, dmin2, d__, e, g; |
648 | 0 | integer k; |
649 | 0 | doublereal s, t; |
650 | 0 | integer nfail; |
651 | 0 | doublereal desig, trace, sigma; |
652 | 0 | integer iinfo; |
653 | 0 | doublereal tempe, tempq; |
654 | 0 | integer i0, i1, i4, n0, n1, ttype; |
655 | 0 | extern /* Subroutine */ void dlasq3_(integer *, integer *, doublereal *, |
656 | 0 | integer *, doublereal *, doublereal *, doublereal *, doublereal *, |
657 | 0 | integer *, integer *, integer *, logical *, integer *, |
658 | 0 | doublereal *, doublereal *, doublereal *, doublereal *, |
659 | 0 | doublereal *, doublereal *, doublereal *); |
660 | 0 | doublereal dn; |
661 | 0 | extern doublereal dlamch_(char *); |
662 | 0 | integer pp; |
663 | 0 | doublereal deemin; |
664 | 0 | integer iwhila, iwhilb; |
665 | 0 | doublereal oldemn, safmin; |
666 | 0 | extern /* Subroutine */ int xerbla_(char *, integer *, ftnlen); |
667 | 0 | extern integer ilaenv_(integer *, char *, char *, integer *, integer *, |
668 | 0 | integer *, integer *, ftnlen, ftnlen); |
669 | 0 | extern /* Subroutine */ void dlasrt_(char *, integer *, doublereal *, |
670 | 0 | integer *); |
671 | 0 | doublereal dn1, dn2, dee, eps, tau, tol; |
672 | 0 | integer ipn4; |
673 | 0 | doublereal tol2; |
674 | | |
675 | | |
676 | | /* -- LAPACK computational routine (version 3.7.0) -- */ |
677 | | /* -- LAPACK is a software package provided by Univ. of Tennessee, -- */ |
678 | | /* -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..-- */ |
679 | | /* December 2016 */ |
680 | | |
681 | | |
682 | | /* ===================================================================== */ |
683 | | |
684 | | |
685 | | /* Test the input arguments. */ |
686 | | /* (in case DLASQ2 is not called by DLASQ1) */ |
687 | | |
688 | | /* Parameter adjustments */ |
689 | 0 | --z__; |
690 | | |
691 | | /* Function Body */ |
692 | 0 | *info = 0; |
693 | 0 | eps = dlamch_("Precision"); |
694 | 0 | safmin = dlamch_("Safe minimum"); |
695 | 0 | tol = eps * 100.; |
696 | | /* Computing 2nd power */ |
697 | 0 | d__1 = tol; |
698 | 0 | tol2 = d__1 * d__1; |
699 | |
|
700 | 0 | if (*n < 0) { |
701 | 0 | *info = -1; |
702 | 0 | xerbla_("DLASQ2", &c__1, (ftnlen)6); |
703 | 0 | return; |
704 | 0 | } else if (*n == 0) { |
705 | 0 | return; |
706 | 0 | } else if (*n == 1) { |
707 | | |
708 | | /* 1-by-1 case. */ |
709 | |
|
710 | 0 | if (z__[1] < 0.) { |
711 | 0 | *info = -201; |
712 | 0 | xerbla_("DLASQ2", &c__2, (ftnlen)6); |
713 | 0 | } |
714 | 0 | return; |
715 | 0 | } else if (*n == 2) { |
716 | | |
717 | | /* 2-by-2 case. */ |
718 | |
|
719 | 0 | if (z__[1] < 0.) { |
720 | 0 | *info = -201; |
721 | 0 | xerbla_("DLASQ2", &c__2, (ftnlen)6); |
722 | 0 | return; |
723 | 0 | } else if (z__[2] < 0.) { |
724 | 0 | *info = -202; |
725 | 0 | xerbla_("DLASQ2", &c__2, (ftnlen)6); |
726 | 0 | return; |
727 | 0 | } else if (z__[3] < 0.) { |
728 | 0 | *info = -203; |
729 | 0 | xerbla_("DLASQ2", &c__2, (ftnlen)6); |
730 | 0 | return; |
731 | 0 | } else if (z__[3] > z__[1]) { |
732 | 0 | d__ = z__[3]; |
733 | 0 | z__[3] = z__[1]; |
734 | 0 | z__[1] = d__; |
735 | 0 | } |
736 | 0 | z__[5] = z__[1] + z__[2] + z__[3]; |
737 | 0 | if (z__[2] > z__[3] * tol2) { |
738 | 0 | t = (z__[1] - z__[3] + z__[2]) * .5; |
739 | 0 | s = z__[3] * (z__[2] / t); |
740 | 0 | if (s <= t) { |
741 | 0 | s = z__[3] * (z__[2] / (t * (sqrt(s / t + 1.) + 1.))); |
742 | 0 | } else { |
743 | 0 | s = z__[3] * (z__[2] / (t + sqrt(t) * sqrt(t + s))); |
744 | 0 | } |
745 | 0 | t = z__[1] + (s + z__[2]); |
746 | 0 | z__[3] *= z__[1] / t; |
747 | 0 | z__[1] = t; |
748 | 0 | } |
749 | 0 | z__[2] = z__[3]; |
750 | 0 | z__[6] = z__[2] + z__[1]; |
751 | 0 | return; |
752 | 0 | } |
753 | | |
754 | | /* Check for negative data and compute sums of q's and e's. */ |
755 | | |
756 | 0 | z__[*n * 2] = 0.; |
757 | 0 | emin = z__[2]; |
758 | 0 | qmax = 0.; |
759 | 0 | zmax = 0.; |
760 | 0 | d__ = 0.; |
761 | 0 | e = 0.; |
762 | |
|
763 | 0 | i__1 = *n - 1 << 1; |
764 | 0 | for (k = 1; k <= i__1; k += 2) { |
765 | 0 | if (z__[k] < 0.) { |
766 | 0 | *info = -(k + 200); |
767 | 0 | xerbla_("DLASQ2", &c__2, (ftnlen)6); |
768 | 0 | return; |
769 | 0 | } else if (z__[k + 1] < 0.) { |
770 | 0 | *info = -(k + 201); |
771 | 0 | xerbla_("DLASQ2", &c__2, (ftnlen)6); |
772 | 0 | return; |
773 | 0 | } |
774 | 0 | d__ += z__[k]; |
775 | 0 | e += z__[k + 1]; |
776 | | /* Computing MAX */ |
777 | 0 | d__1 = qmax, d__2 = z__[k]; |
778 | 0 | qmax = f2cmax(d__1,d__2); |
779 | | /* Computing MIN */ |
780 | 0 | d__1 = emin, d__2 = z__[k + 1]; |
781 | 0 | emin = f2cmin(d__1,d__2); |
782 | | /* Computing MAX */ |
783 | 0 | d__1 = f2cmax(qmax,zmax), d__2 = z__[k + 1]; |
784 | 0 | zmax = f2cmax(d__1,d__2); |
785 | | /* L10: */ |
786 | 0 | } |
787 | 0 | if (z__[(*n << 1) - 1] < 0.) { |
788 | 0 | *info = -((*n << 1) + 199); |
789 | 0 | xerbla_("DLASQ2", &c__2, (ftnlen)6); |
790 | 0 | return; |
791 | 0 | } |
792 | 0 | d__ += z__[(*n << 1) - 1]; |
793 | | /* Computing MAX */ |
794 | 0 | d__1 = qmax, d__2 = z__[(*n << 1) - 1]; |
795 | 0 | qmax = f2cmax(d__1,d__2); |
796 | 0 | zmax = f2cmax(qmax,zmax); |
797 | | |
798 | | /* Check for diagonality. */ |
799 | |
|
800 | 0 | if (e == 0.) { |
801 | 0 | i__1 = *n; |
802 | 0 | for (k = 2; k <= i__1; ++k) { |
803 | 0 | z__[k] = z__[(k << 1) - 1]; |
804 | | /* L20: */ |
805 | 0 | } |
806 | 0 | dlasrt_("D", n, &z__[1], &iinfo); |
807 | 0 | z__[(*n << 1) - 1] = d__; |
808 | 0 | return; |
809 | 0 | } |
810 | | |
811 | 0 | trace = d__ + e; |
812 | | |
813 | | /* Check for zero data. */ |
814 | |
|
815 | 0 | if (trace == 0.) { |
816 | 0 | z__[(*n << 1) - 1] = 0.; |
817 | 0 | return; |
818 | 0 | } |
819 | | |
820 | | /* Check whether the machine is IEEE conformable. */ |
821 | | |
822 | 0 | ieee = ilaenv_(&c__10, "DLASQ2", "N", &c__1, &c__2, &c__3, &c__4, (ftnlen) |
823 | 0 | 6, (ftnlen)1) == 1 && ilaenv_(&c__11, "DLASQ2", "N", &c__1, &c__2, |
824 | 0 | &c__3, &c__4, (ftnlen)6, (ftnlen)1) == 1; |
825 | | |
826 | | /* Rearrange data for locality: Z=(q1,qq1,e1,ee1,q2,qq2,e2,ee2,...). */ |
827 | |
|
828 | 0 | for (k = *n << 1; k >= 2; k += -2) { |
829 | 0 | z__[k * 2] = 0.; |
830 | 0 | z__[(k << 1) - 1] = z__[k]; |
831 | 0 | z__[(k << 1) - 2] = 0.; |
832 | 0 | z__[(k << 1) - 3] = z__[k - 1]; |
833 | | /* L30: */ |
834 | 0 | } |
835 | |
|
836 | 0 | i0 = 1; |
837 | 0 | n0 = *n; |
838 | | |
839 | | /* Reverse the qd-array, if warranted. */ |
840 | |
|
841 | 0 | if (z__[(i0 << 2) - 3] * 1.5 < z__[(n0 << 2) - 3]) { |
842 | 0 | ipn4 = i0 + n0 << 2; |
843 | 0 | i__1 = i0 + n0 - 1 << 1; |
844 | 0 | for (i4 = i0 << 2; i4 <= i__1; i4 += 4) { |
845 | 0 | temp = z__[i4 - 3]; |
846 | 0 | z__[i4 - 3] = z__[ipn4 - i4 - 3]; |
847 | 0 | z__[ipn4 - i4 - 3] = temp; |
848 | 0 | temp = z__[i4 - 1]; |
849 | 0 | z__[i4 - 1] = z__[ipn4 - i4 - 5]; |
850 | 0 | z__[ipn4 - i4 - 5] = temp; |
851 | | /* L40: */ |
852 | 0 | } |
853 | 0 | } |
854 | | |
855 | | /* Initial split checking via dqd and Li's test. */ |
856 | |
|
857 | 0 | pp = 0; |
858 | |
|
859 | 0 | for (k = 1; k <= 2; ++k) { |
860 | |
|
861 | 0 | d__ = z__[(n0 << 2) + pp - 3]; |
862 | 0 | i__1 = (i0 << 2) + pp; |
863 | 0 | for (i4 = (n0 - 1 << 2) + pp; i4 >= i__1; i4 += -4) { |
864 | 0 | if (z__[i4 - 1] <= tol2 * d__) { |
865 | 0 | z__[i4 - 1] = 0.; |
866 | 0 | d__ = z__[i4 - 3]; |
867 | 0 | } else { |
868 | 0 | d__ = z__[i4 - 3] * (d__ / (d__ + z__[i4 - 1])); |
869 | 0 | } |
870 | | /* L50: */ |
871 | 0 | } |
872 | | |
873 | | /* dqd maps Z to ZZ plus Li's test. */ |
874 | |
|
875 | 0 | emin = z__[(i0 << 2) + pp + 1]; |
876 | 0 | d__ = z__[(i0 << 2) + pp - 3]; |
877 | 0 | i__1 = (n0 - 1 << 2) + pp; |
878 | 0 | for (i4 = (i0 << 2) + pp; i4 <= i__1; i4 += 4) { |
879 | 0 | z__[i4 - (pp << 1) - 2] = d__ + z__[i4 - 1]; |
880 | 0 | if (z__[i4 - 1] <= tol2 * d__) { |
881 | 0 | z__[i4 - 1] = 0.; |
882 | 0 | z__[i4 - (pp << 1) - 2] = d__; |
883 | 0 | z__[i4 - (pp << 1)] = 0.; |
884 | 0 | d__ = z__[i4 + 1]; |
885 | 0 | } else if (safmin * z__[i4 + 1] < z__[i4 - (pp << 1) - 2] && |
886 | 0 | safmin * z__[i4 - (pp << 1) - 2] < z__[i4 + 1]) { |
887 | 0 | temp = z__[i4 + 1] / z__[i4 - (pp << 1) - 2]; |
888 | 0 | z__[i4 - (pp << 1)] = z__[i4 - 1] * temp; |
889 | 0 | d__ *= temp; |
890 | 0 | } else { |
891 | 0 | z__[i4 - (pp << 1)] = z__[i4 + 1] * (z__[i4 - 1] / z__[i4 - ( |
892 | 0 | pp << 1) - 2]); |
893 | 0 | d__ = z__[i4 + 1] * (d__ / z__[i4 - (pp << 1) - 2]); |
894 | 0 | } |
895 | | /* Computing MIN */ |
896 | 0 | d__1 = emin, d__2 = z__[i4 - (pp << 1)]; |
897 | 0 | emin = f2cmin(d__1,d__2); |
898 | | /* L60: */ |
899 | 0 | } |
900 | 0 | z__[(n0 << 2) - pp - 2] = d__; |
901 | | |
902 | | /* Now find qmax. */ |
903 | |
|
904 | 0 | qmax = z__[(i0 << 2) - pp - 2]; |
905 | 0 | i__1 = (n0 << 2) - pp - 2; |
906 | 0 | for (i4 = (i0 << 2) - pp + 2; i4 <= i__1; i4 += 4) { |
907 | | /* Computing MAX */ |
908 | 0 | d__1 = qmax, d__2 = z__[i4]; |
909 | 0 | qmax = f2cmax(d__1,d__2); |
910 | | /* L70: */ |
911 | 0 | } |
912 | | |
913 | | /* Prepare for the next iteration on K. */ |
914 | |
|
915 | 0 | pp = 1 - pp; |
916 | | /* L80: */ |
917 | 0 | } |
918 | | |
919 | | /* Initialise variables to pass to DLASQ3. */ |
920 | |
|
921 | 0 | ttype = 0; |
922 | 0 | dmin1 = 0.; |
923 | 0 | dmin2 = 0.; |
924 | 0 | dn = 0.; |
925 | 0 | dn1 = 0.; |
926 | 0 | dn2 = 0.; |
927 | 0 | g = 0.; |
928 | 0 | tau = 0.; |
929 | |
|
930 | 0 | iter = 2; |
931 | 0 | nfail = 0; |
932 | 0 | ndiv = n0 - i0 << 1; |
933 | |
|
934 | 0 | i__1 = *n + 1; |
935 | 0 | for (iwhila = 1; iwhila <= i__1; ++iwhila) { |
936 | 0 | if (n0 < 1) { |
937 | 0 | goto L170; |
938 | 0 | } |
939 | | |
940 | | /* While array unfinished do */ |
941 | | |
942 | | /* E(N0) holds the value of SIGMA when submatrix in I0:N0 */ |
943 | | /* splits from the rest of the array, but is negated. */ |
944 | | |
945 | 0 | desig = 0.; |
946 | 0 | if (n0 == *n) { |
947 | 0 | sigma = 0.; |
948 | 0 | } else { |
949 | 0 | sigma = -z__[(n0 << 2) - 1]; |
950 | 0 | } |
951 | 0 | if (sigma < 0.) { |
952 | 0 | *info = 1; |
953 | 0 | return; |
954 | 0 | } |
955 | | |
956 | | /* Find last unreduced submatrix's top index I0, find QMAX and */ |
957 | | /* EMIN. Find Gershgorin-type bound if Q's much greater than E's. */ |
958 | | |
959 | 0 | emax = 0.; |
960 | 0 | if (n0 > i0) { |
961 | 0 | emin = (d__1 = z__[(n0 << 2) - 5], abs(d__1)); |
962 | 0 | } else { |
963 | 0 | emin = 0.; |
964 | 0 | } |
965 | 0 | qmin = z__[(n0 << 2) - 3]; |
966 | 0 | qmax = qmin; |
967 | 0 | for (i4 = n0 << 2; i4 >= 8; i4 += -4) { |
968 | 0 | if (z__[i4 - 5] <= 0.) { |
969 | 0 | goto L100; |
970 | 0 | } |
971 | 0 | if (qmin >= emax * 4.) { |
972 | | /* Computing MIN */ |
973 | 0 | d__1 = qmin, d__2 = z__[i4 - 3]; |
974 | 0 | qmin = f2cmin(d__1,d__2); |
975 | | /* Computing MAX */ |
976 | 0 | d__1 = emax, d__2 = z__[i4 - 5]; |
977 | 0 | emax = f2cmax(d__1,d__2); |
978 | 0 | } |
979 | | /* Computing MAX */ |
980 | 0 | d__1 = qmax, d__2 = z__[i4 - 7] + z__[i4 - 5]; |
981 | 0 | qmax = f2cmax(d__1,d__2); |
982 | | /* Computing MIN */ |
983 | 0 | d__1 = emin, d__2 = z__[i4 - 5]; |
984 | 0 | emin = f2cmin(d__1,d__2); |
985 | | /* L90: */ |
986 | 0 | } |
987 | 0 | i4 = 4; |
988 | |
|
989 | 0 | L100: |
990 | 0 | i0 = i4 / 4; |
991 | 0 | pp = 0; |
992 | |
|
993 | 0 | if (n0 - i0 > 1) { |
994 | 0 | dee = z__[(i0 << 2) - 3]; |
995 | 0 | deemin = dee; |
996 | 0 | kmin = i0; |
997 | 0 | i__2 = (n0 << 2) - 3; |
998 | 0 | for (i4 = (i0 << 2) + 1; i4 <= i__2; i4 += 4) { |
999 | 0 | dee = z__[i4] * (dee / (dee + z__[i4 - 2])); |
1000 | 0 | if (dee <= deemin) { |
1001 | 0 | deemin = dee; |
1002 | 0 | kmin = (i4 + 3) / 4; |
1003 | 0 | } |
1004 | | /* L110: */ |
1005 | 0 | } |
1006 | 0 | if (kmin - i0 << 1 < n0 - kmin && deemin <= z__[(n0 << 2) - 3] * |
1007 | 0 | .5) { |
1008 | 0 | ipn4 = i0 + n0 << 2; |
1009 | 0 | pp = 2; |
1010 | 0 | i__2 = i0 + n0 - 1 << 1; |
1011 | 0 | for (i4 = i0 << 2; i4 <= i__2; i4 += 4) { |
1012 | 0 | temp = z__[i4 - 3]; |
1013 | 0 | z__[i4 - 3] = z__[ipn4 - i4 - 3]; |
1014 | 0 | z__[ipn4 - i4 - 3] = temp; |
1015 | 0 | temp = z__[i4 - 2]; |
1016 | 0 | z__[i4 - 2] = z__[ipn4 - i4 - 2]; |
1017 | 0 | z__[ipn4 - i4 - 2] = temp; |
1018 | 0 | temp = z__[i4 - 1]; |
1019 | 0 | z__[i4 - 1] = z__[ipn4 - i4 - 5]; |
1020 | 0 | z__[ipn4 - i4 - 5] = temp; |
1021 | 0 | temp = z__[i4]; |
1022 | 0 | z__[i4] = z__[ipn4 - i4 - 4]; |
1023 | 0 | z__[ipn4 - i4 - 4] = temp; |
1024 | | /* L120: */ |
1025 | 0 | } |
1026 | 0 | } |
1027 | 0 | } |
1028 | | |
1029 | | /* Put -(initial shift) into DMIN. */ |
1030 | | |
1031 | | /* Computing MAX */ |
1032 | 0 | d__1 = 0., d__2 = qmin - sqrt(qmin) * 2. * sqrt(emax); |
1033 | 0 | dmin__ = -f2cmax(d__1,d__2); |
1034 | | |
1035 | | /* Now I0:N0 is unreduced. */ |
1036 | | /* PP = 0 for ping, PP = 1 for pong. */ |
1037 | | /* PP = 2 indicates that flipping was applied to the Z array and */ |
1038 | | /* and that the tests for deflation upon entry in DLASQ3 */ |
1039 | | /* should not be performed. */ |
1040 | |
|
1041 | 0 | nbig = (n0 - i0 + 1) * 100; |
1042 | 0 | i__2 = nbig; |
1043 | 0 | for (iwhilb = 1; iwhilb <= i__2; ++iwhilb) { |
1044 | 0 | if (i0 > n0) { |
1045 | 0 | goto L150; |
1046 | 0 | } |
1047 | | |
1048 | | /* While submatrix unfinished take a good dqds step. */ |
1049 | | |
1050 | 0 | dlasq3_(&i0, &n0, &z__[1], &pp, &dmin__, &sigma, &desig, &qmax, & |
1051 | 0 | nfail, &iter, &ndiv, &ieee, &ttype, &dmin1, &dmin2, &dn, & |
1052 | 0 | dn1, &dn2, &g, &tau); |
1053 | |
|
1054 | 0 | pp = 1 - pp; |
1055 | | |
1056 | | /* When EMIN is very small check for splits. */ |
1057 | |
|
1058 | 0 | if (pp == 0 && n0 - i0 >= 3) { |
1059 | 0 | if (z__[n0 * 4] <= tol2 * qmax || z__[(n0 << 2) - 1] <= tol2 * |
1060 | 0 | sigma) { |
1061 | 0 | splt = i0 - 1; |
1062 | 0 | qmax = z__[(i0 << 2) - 3]; |
1063 | 0 | emin = z__[(i0 << 2) - 1]; |
1064 | 0 | oldemn = z__[i0 * 4]; |
1065 | 0 | i__3 = n0 - 3 << 2; |
1066 | 0 | for (i4 = i0 << 2; i4 <= i__3; i4 += 4) { |
1067 | 0 | if (z__[i4] <= tol2 * z__[i4 - 3] || z__[i4 - 1] <= |
1068 | 0 | tol2 * sigma) { |
1069 | 0 | z__[i4 - 1] = -sigma; |
1070 | 0 | splt = i4 / 4; |
1071 | 0 | qmax = 0.; |
1072 | 0 | emin = z__[i4 + 3]; |
1073 | 0 | oldemn = z__[i4 + 4]; |
1074 | 0 | } else { |
1075 | | /* Computing MAX */ |
1076 | 0 | d__1 = qmax, d__2 = z__[i4 + 1]; |
1077 | 0 | qmax = f2cmax(d__1,d__2); |
1078 | | /* Computing MIN */ |
1079 | 0 | d__1 = emin, d__2 = z__[i4 - 1]; |
1080 | 0 | emin = f2cmin(d__1,d__2); |
1081 | | /* Computing MIN */ |
1082 | 0 | d__1 = oldemn, d__2 = z__[i4]; |
1083 | 0 | oldemn = f2cmin(d__1,d__2); |
1084 | 0 | } |
1085 | | /* L130: */ |
1086 | 0 | } |
1087 | 0 | z__[(n0 << 2) - 1] = emin; |
1088 | 0 | z__[n0 * 4] = oldemn; |
1089 | 0 | i0 = splt + 1; |
1090 | 0 | } |
1091 | 0 | } |
1092 | | |
1093 | | /* L140: */ |
1094 | 0 | } |
1095 | | |
1096 | 0 | *info = 2; |
1097 | | |
1098 | | /* Maximum number of iterations exceeded, restore the shift */ |
1099 | | /* SIGMA and place the new d's and e's in a qd array. */ |
1100 | | /* This might need to be done for several blocks */ |
1101 | |
|
1102 | 0 | i1 = i0; |
1103 | 0 | n1 = n0; |
1104 | 0 | L145: |
1105 | 0 | tempq = z__[(i0 << 2) - 3]; |
1106 | 0 | z__[(i0 << 2) - 3] += sigma; |
1107 | 0 | i__2 = n0; |
1108 | 0 | for (k = i0 + 1; k <= i__2; ++k) { |
1109 | 0 | tempe = z__[(k << 2) - 5]; |
1110 | 0 | z__[(k << 2) - 5] *= tempq / z__[(k << 2) - 7]; |
1111 | 0 | tempq = z__[(k << 2) - 3]; |
1112 | 0 | z__[(k << 2) - 3] = z__[(k << 2) - 3] + sigma + tempe - z__[(k << |
1113 | 0 | 2) - 5]; |
1114 | 0 | } |
1115 | | |
1116 | | /* Prepare to do this on the previous block if there is one */ |
1117 | |
|
1118 | 0 | if (i1 > 1) { |
1119 | 0 | n1 = i1 - 1; |
1120 | 0 | while(i1 >= 2 && z__[(i1 << 2) - 5] >= 0.) { |
1121 | 0 | --i1; |
1122 | 0 | } |
1123 | 0 | sigma = -z__[(n1 << 2) - 1]; |
1124 | 0 | goto L145; |
1125 | 0 | } |
1126 | 0 | i__2 = *n; |
1127 | 0 | for (k = 1; k <= i__2; ++k) { |
1128 | 0 | z__[(k << 1) - 1] = z__[(k << 2) - 3]; |
1129 | | |
1130 | | /* Only the block 1..N0 is unfinished. The rest of the e's */ |
1131 | | /* must be essentially zero, although sometimes other data */ |
1132 | | /* has been stored in them. */ |
1133 | |
|
1134 | 0 | if (k < n0) { |
1135 | 0 | z__[k * 2] = z__[(k << 2) - 1]; |
1136 | 0 | } else { |
1137 | 0 | z__[k * 2] = 0.; |
1138 | 0 | } |
1139 | 0 | } |
1140 | 0 | return; |
1141 | | |
1142 | | /* end IWHILB */ |
1143 | | |
1144 | 0 | L150: |
1145 | | |
1146 | | /* L160: */ |
1147 | 0 | ; |
1148 | 0 | } |
1149 | | |
1150 | 0 | *info = 3; |
1151 | 0 | return; |
1152 | | |
1153 | | /* end IWHILA */ |
1154 | | |
1155 | 0 | L170: |
1156 | | |
1157 | | /* Move q's to the front. */ |
1158 | |
|
1159 | 0 | i__1 = *n; |
1160 | 0 | for (k = 2; k <= i__1; ++k) { |
1161 | 0 | z__[k] = z__[(k << 2) - 3]; |
1162 | | /* L180: */ |
1163 | 0 | } |
1164 | | |
1165 | | /* Sort and compute sum of eigenvalues. */ |
1166 | |
|
1167 | 0 | dlasrt_("D", n, &z__[1], &iinfo); |
1168 | |
|
1169 | 0 | e = 0.; |
1170 | 0 | for (k = *n; k >= 1; --k) { |
1171 | 0 | e += z__[k]; |
1172 | | /* L190: */ |
1173 | 0 | } |
1174 | | |
1175 | | /* Store trace, sum(eigenvalues) and information on performance. */ |
1176 | |
|
1177 | 0 | z__[(*n << 1) + 1] = trace; |
1178 | 0 | z__[(*n << 1) + 2] = e; |
1179 | 0 | z__[(*n << 1) + 3] = (doublereal) iter; |
1180 | | /* Computing 2nd power */ |
1181 | 0 | i__1 = *n; |
1182 | 0 | z__[(*n << 1) + 4] = (doublereal) ndiv / (doublereal) (i__1 * i__1); |
1183 | 0 | z__[(*n << 1) + 5] = nfail * 100. / (doublereal) iter; |
1184 | 0 | return; |
1185 | | |
1186 | | /* End of DLASQ2 */ |
1187 | |
|
1188 | 0 | } /* dlasq2_ */ |
1189 | | |