LAPACK 3.12.1
LAPACK: Linear Algebra PACKage
Loading...
Searching...
No Matches
cheevd_2stage.f
Go to the documentation of this file.
1*> \brief <b> CHEEVD_2STAGE computes the eigenvalues and, optionally, the left and/or right eigenvectors for HE matrices</b>
2*
3* @generated from zheevd_2stage.f, fortran z -> c, Sat Nov 5 23:18:14 2016
4*
5* =========== DOCUMENTATION ===========
6*
7* Online html documentation available at
8* http://www.netlib.org/lapack/explore-html/
9*
10*> Download CHEEVD_2STAGE + dependencies
11*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/cheevd_2stage.f">
12*> [TGZ]</a>
13*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/cheevd_2stage.f">
14*> [ZIP]</a>
15*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/cheevd_2stage.f">
16*> [TXT]</a>
17*
18* Definition:
19* ===========
20*
21* SUBROUTINE CHEEVD_2STAGE( JOBZ, UPLO, N, A, LDA, W, WORK, LWORK,
22* RWORK, LRWORK, IWORK, LIWORK, INFO )
23*
24* IMPLICIT NONE
25*
26* .. Scalar Arguments ..
27* CHARACTER JOBZ, UPLO
28* INTEGER INFO, LDA, LIWORK, LRWORK, LWORK, N
29* ..
30* .. Array Arguments ..
31* INTEGER IWORK( * )
32* REAL RWORK( * ), W( * )
33* COMPLEX A( LDA, * ), WORK( * )
34* ..
35*
36*
37*> \par Purpose:
38* =============
39*>
40*> \verbatim
41*>
42*> CHEEVD_2STAGE computes all eigenvalues and, optionally, eigenvectors of a
43*> complex Hermitian matrix A using the 2stage technique for
44*> the reduction to tridiagonal. If eigenvectors are desired, it uses a
45*> divide and conquer algorithm.
46*>
47*> \endverbatim
48*
49* Arguments:
50* ==========
51*
52*> \param[in] JOBZ
53*> \verbatim
54*> JOBZ is CHARACTER*1
55*> = 'N': Compute eigenvalues only;
56*> = 'V': Compute eigenvalues and eigenvectors.
57*> Not available in this release.
58*> \endverbatim
59*>
60*> \param[in] UPLO
61*> \verbatim
62*> UPLO is CHARACTER*1
63*> = 'U': Upper triangle of A is stored;
64*> = 'L': Lower triangle of A is stored.
65*> \endverbatim
66*>
67*> \param[in] N
68*> \verbatim
69*> N is INTEGER
70*> The order of the matrix A. N >= 0.
71*> \endverbatim
72*>
73*> \param[in,out] A
74*> \verbatim
75*> A is COMPLEX array, dimension (LDA, N)
76*> On entry, the Hermitian matrix A. If UPLO = 'U', the
77*> leading N-by-N upper triangular part of A contains the
78*> upper triangular part of the matrix A. If UPLO = 'L',
79*> the leading N-by-N lower triangular part of A contains
80*> the lower triangular part of the matrix A.
81*> On exit, if JOBZ = 'V', then if INFO = 0, A contains the
82*> orthonormal eigenvectors of the matrix A.
83*> If JOBZ = 'N', then on exit the lower triangle (if UPLO='L')
84*> or the upper triangle (if UPLO='U') of A, including the
85*> diagonal, is destroyed.
86*> \endverbatim
87*>
88*> \param[in] LDA
89*> \verbatim
90*> LDA is INTEGER
91*> The leading dimension of the array A. LDA >= max(1,N).
92*> \endverbatim
93*>
94*> \param[out] W
95*> \verbatim
96*> W is REAL array, dimension (N)
97*> If INFO = 0, the eigenvalues in ascending order.
98*> \endverbatim
99*>
100*> \param[out] WORK
101*> \verbatim
102*> WORK is COMPLEX array, dimension (MAX(1,LWORK))
103*> On exit, if INFO = 0, WORK(1) returns the optimal LWORK.
104*> \endverbatim
105*>
106*> \param[in] LWORK
107*> \verbatim
108*> LWORK is INTEGER
109*> The dimension of the array WORK.
110*> If N <= 1, LWORK must be at least 1.
111*> If JOBZ = 'N' and N > 1, LWORK must be queried.
112*> LWORK = MAX(1, dimension) where
113*> dimension = max(stage1,stage2) + (KD+1)*N + N+1
114*> = N*KD + N*max(KD+1,FACTOPTNB)
115*> + max(2*KD*KD, KD*NTHREADS)
116*> + (KD+1)*N + N+1
117*> where KD is the blocking size of the reduction,
118*> FACTOPTNB is the blocking used by the QR or LQ
119*> algorithm, usually FACTOPTNB=128 is a good choice
120*> NTHREADS is the number of threads used when
121*> openMP compilation is enabled, otherwise =1.
122*> If JOBZ = 'V' and N > 1, LWORK must be at least 2*N + N**2
123*>
124*> If LWORK = -1, then a workspace query is assumed; the routine
125*> only calculates the optimal sizes of the WORK, RWORK and
126*> IWORK arrays, returns these values as the first entries of
127*> the WORK, RWORK and IWORK arrays, and no error message
128*> related to LWORK or LRWORK or LIWORK is issued by XERBLA.
129*> \endverbatim
130*>
131*> \param[out] RWORK
132*> \verbatim
133*> RWORK is REAL array,
134*> dimension (LRWORK)
135*> On exit, if INFO = 0, RWORK(1) returns the optimal LRWORK.
136*> \endverbatim
137*>
138*> \param[in] LRWORK
139*> \verbatim
140*> LRWORK is INTEGER
141*> The dimension of the array RWORK.
142*> If N <= 1, LRWORK must be at least 1.
143*> If JOBZ = 'N' and N > 1, LRWORK must be at least N.
144*> If JOBZ = 'V' and N > 1, LRWORK must be at least
145*> 1 + 5*N + 2*N**2.
146*>
147*> If LRWORK = -1, then a workspace query is assumed; the
148*> routine only calculates the optimal sizes of the WORK, RWORK
149*> and IWORK arrays, returns these values as the first entries
150*> of the WORK, RWORK and IWORK arrays, and no error message
151*> related to LWORK or LRWORK or LIWORK is issued by XERBLA.
152*> \endverbatim
153*>
154*> \param[out] IWORK
155*> \verbatim
156*> IWORK is INTEGER array, dimension (MAX(1,LIWORK))
157*> On exit, if INFO = 0, IWORK(1) returns the optimal LIWORK.
158*> \endverbatim
159*>
160*> \param[in] LIWORK
161*> \verbatim
162*> LIWORK is INTEGER
163*> The dimension of the array IWORK.
164*> If N <= 1, LIWORK must be at least 1.
165*> If JOBZ = 'N' and N > 1, LIWORK must be at least 1.
166*> If JOBZ = 'V' and N > 1, LIWORK must be at least 3 + 5*N.
167*>
168*> If LIWORK = -1, then a workspace query is assumed; the
169*> routine only calculates the optimal sizes of the WORK, RWORK
170*> and IWORK arrays, returns these values as the first entries
171*> of the WORK, RWORK and IWORK arrays, and no error message
172*> related to LWORK or LRWORK or LIWORK is issued by XERBLA.
173*> \endverbatim
174*>
175*> \param[out] INFO
176*> \verbatim
177*> INFO is INTEGER
178*> = 0: successful exit
179*> < 0: if INFO = -i, the i-th argument had an illegal value
180*> > 0: if INFO = i and JOBZ = 'N', then the algorithm failed
181*> to converge; i off-diagonal elements of an intermediate
182*> tridiagonal form did not converge to zero;
183*> if INFO = i and JOBZ = 'V', then the algorithm failed
184*> to compute an eigenvalue while working on the submatrix
185*> lying in rows and columns INFO/(N+1) through
186*> mod(INFO,N+1).
187*> \endverbatim
188*
189* Authors:
190* ========
191*
192*> \author Univ. of Tennessee
193*> \author Univ. of California Berkeley
194*> \author Univ. of Colorado Denver
195*> \author NAG Ltd.
196*
197*> \ingroup heevd_2stage
198*
199*> \par Further Details:
200* =====================
201*>
202*> Modified description of INFO. Sven, 16 Feb 05.
203*
204*> \par Contributors:
205* ==================
206*>
207*> Jeff Rutter, Computer Science Division, University of California
208*> at Berkeley, USA
209*>
210*> \par Further Details:
211* =====================
212*>
213*> \verbatim
214*>
215*> All details about the 2stage techniques are available in:
216*>
217*> Azzam Haidar, Hatem Ltaief, and Jack Dongarra.
218*> Parallel reduction to condensed forms for symmetric eigenvalue problems
219*> using aggregated fine-grained and memory-aware kernels. In Proceedings
220*> of 2011 International Conference for High Performance Computing,
221*> Networking, Storage and Analysis (SC '11), New York, NY, USA,
222*> Article 8 , 11 pages.
223*> http://doi.acm.org/10.1145/2063384.2063394
224*>
225*> A. Haidar, J. Kurzak, P. Luszczek, 2013.
226*> An improved parallel singular value algorithm and its implementation
227*> for multicore hardware, In Proceedings of 2013 International Conference
228*> for High Performance Computing, Networking, Storage and Analysis (SC '13).
229*> Denver, Colorado, USA, 2013.
230*> Article 90, 12 pages.
231*> http://doi.acm.org/10.1145/2503210.2503292
232*>
233*> A. Haidar, R. Solca, S. Tomov, T. Schulthess and J. Dongarra.
234*> A novel hybrid CPU-GPU generalized eigensolver for electronic structure
235*> calculations based on fine-grained memory aware tasks.
236*> International Journal of High Performance Computing Applications.
237*> Volume 28 Issue 2, Pages 196-209, May 2014.
238*> http://hpc.sagepub.com/content/28/2/196
239*>
240*> \endverbatim
241*
242* =====================================================================
243 SUBROUTINE cheevd_2stage( JOBZ, UPLO, N, A, LDA, W, WORK,
244 $ LWORK,
245 $ RWORK, LRWORK, IWORK, LIWORK, INFO )
246*
247 IMPLICIT NONE
248*
249* -- LAPACK driver routine --
250* -- LAPACK is a software package provided by Univ. of Tennessee, --
251* -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
252*
253* .. Scalar Arguments ..
254 CHARACTER JOBZ, UPLO
255 INTEGER INFO, LDA, LIWORK, LRWORK, LWORK, N
256* ..
257* .. Array Arguments ..
258 INTEGER IWORK( * )
259 REAL RWORK( * ), W( * )
260 COMPLEX A( LDA, * ), WORK( * )
261* ..
262*
263* =====================================================================
264*
265* .. Parameters ..
266 REAL ZERO, ONE
267 PARAMETER ( ZERO = 0.0e0, one = 1.0e0 )
268 COMPLEX CONE
269 parameter( cone = ( 1.0e0, 0.0e0 ) )
270* ..
271* .. Local Scalars ..
272 LOGICAL LOWER, LQUERY, WANTZ
273 INTEGER IINFO, IMAX, INDE, INDRWK, INDTAU, INDWK2,
274 $ indwrk, iscale, liwmin, llrwk, llwork,
275 $ llwrk2, lrwmin, lwmin,
276 $ lhtrd, lwtrd, kd, ib, indhous
277
278
279 REAL ANRM, BIGNUM, EPS, RMAX, RMIN, SAFMIN, SIGMA,
280 $ SMLNUM
281* ..
282* .. External Functions ..
283 LOGICAL LSAME
284 INTEGER ILAENV2STAGE
285 REAL SLAMCH, CLANHE
286 EXTERNAL lsame, slamch, clanhe, ilaenv2stage
287* ..
288* .. External Subroutines ..
289 EXTERNAL sscal, ssterf, xerbla, clacpy,
290 $ clascl,
292* ..
293* .. Intrinsic Functions ..
294 INTRINSIC real, max, sqrt
295* ..
296* .. Executable Statements ..
297*
298* Test the input parameters.
299*
300 wantz = lsame( jobz, 'V' )
301 lower = lsame( uplo, 'L' )
302 lquery = ( lwork.EQ.-1 .OR. lrwork.EQ.-1 .OR. liwork.EQ.-1 )
303*
304 info = 0
305 IF( .NOT.( lsame( jobz, 'N' ) ) ) THEN
306 info = -1
307 ELSE IF( .NOT.( lower .OR. lsame( uplo, 'U' ) ) ) THEN
308 info = -2
309 ELSE IF( n.LT.0 ) THEN
310 info = -3
311 ELSE IF( lda.LT.max( 1, n ) ) THEN
312 info = -5
313 END IF
314*
315 IF( info.EQ.0 ) THEN
316 IF( n.LE.1 ) THEN
317 lwmin = 1
318 lrwmin = 1
319 liwmin = 1
320 ELSE
321 kd = ilaenv2stage( 1, 'CHETRD_2STAGE', jobz,
322 $ n, -1, -1, -1 )
323 ib = ilaenv2stage( 2, 'CHETRD_2STAGE', jobz,
324 $ n, kd, -1, -1 )
325 lhtrd = ilaenv2stage( 3, 'CHETRD_2STAGE', jobz,
326 $ n, kd, ib, -1 )
327 lwtrd = ilaenv2stage( 4, 'CHETRD_2STAGE', jobz,
328 $ n, kd, ib, -1 )
329 IF( wantz ) THEN
330 lwmin = 2*n + n*n
331 lrwmin = 1 + 5*n + 2*n**2
332 liwmin = 3 + 5*n
333 ELSE
334 lwmin = n + 1 + lhtrd + lwtrd
335 lrwmin = n
336 liwmin = 1
337 END IF
338 END IF
339 work( 1 ) = cmplx( lwmin )
340 rwork( 1 ) = real( lrwmin )
341 iwork( 1 ) = liwmin
342*
343 IF( lwork.LT.lwmin .AND. .NOT.lquery ) THEN
344 info = -8
345 ELSE IF( lrwork.LT.lrwmin .AND. .NOT.lquery ) THEN
346 info = -10
347 ELSE IF( liwork.LT.liwmin .AND. .NOT.lquery ) THEN
348 info = -12
349 END IF
350 END IF
351*
352 IF( info.NE.0 ) THEN
353 CALL xerbla( 'CHEEVD_2STAGE', -info )
354 RETURN
355 ELSE IF( lquery ) THEN
356 RETURN
357 END IF
358*
359* Quick return if possible
360*
361 IF( n.EQ.0 )
362 $ RETURN
363*
364 IF( n.EQ.1 ) THEN
365 w( 1 ) = real( a( 1, 1 ) )
366 IF( wantz )
367 $ a( 1, 1 ) = cone
368 RETURN
369 END IF
370*
371* Get machine constants.
372*
373 safmin = slamch( 'Safe minimum' )
374 eps = slamch( 'Precision' )
375 smlnum = safmin / eps
376 bignum = one / smlnum
377 rmin = sqrt( smlnum )
378 rmax = sqrt( bignum )
379*
380* Scale matrix to allowable range, if necessary.
381*
382 anrm = clanhe( 'M', uplo, n, a, lda, rwork )
383 iscale = 0
384 IF( anrm.GT.zero .AND. anrm.LT.rmin ) THEN
385 iscale = 1
386 sigma = rmin / anrm
387 ELSE IF( anrm.GT.rmax ) THEN
388 iscale = 1
389 sigma = rmax / anrm
390 END IF
391 IF( iscale.EQ.1 )
392 $ CALL clascl( uplo, 0, 0, one, sigma, n, n, a, lda, info )
393*
394* Call CHETRD_2STAGE to reduce Hermitian matrix to tridiagonal form.
395*
396 inde = 1
397 indrwk = inde + n
398 llrwk = lrwork - indrwk + 1
399 indtau = 1
400 indhous = indtau + n
401 indwrk = indhous + lhtrd
402 llwork = lwork - indwrk + 1
403 indwk2 = indwrk + n*n
404 llwrk2 = lwork - indwk2 + 1
405*
406 CALL chetrd_2stage( jobz, uplo, n, a, lda, w, rwork( inde ),
407 $ work( indtau ), work( indhous ), lhtrd,
408 $ work( indwrk ), llwork, iinfo )
409*
410* For eigenvalues only, call SSTERF. For eigenvectors, first call
411* CSTEDC to generate the eigenvector matrix, WORK(INDWRK), of the
412* tridiagonal matrix, then call CUNMTR to multiply it to the
413* Householder transformations represented as Householder vectors in
414* A.
415*
416 IF( .NOT.wantz ) THEN
417 CALL ssterf( n, w, rwork( inde ), info )
418 ELSE
419 CALL cstedc( 'I', n, w, rwork( inde ), work( indwrk ), n,
420 $ work( indwk2 ), llwrk2, rwork( indrwk ), llrwk,
421 $ iwork, liwork, info )
422 CALL cunmtr( 'L', uplo, 'N', n, n, a, lda, work( indtau ),
423 $ work( indwrk ), n, work( indwk2 ), llwrk2, iinfo )
424 CALL clacpy( 'A', n, n, work( indwrk ), n, a, lda )
425 END IF
426*
427* If matrix was scaled, then rescale eigenvalues appropriately.
428*
429 IF( iscale.EQ.1 ) THEN
430 IF( info.EQ.0 ) THEN
431 imax = n
432 ELSE
433 imax = info - 1
434 END IF
435 CALL sscal( imax, one / sigma, w, 1 )
436 END IF
437*
438 work( 1 ) = cmplx( lwmin )
439 rwork( 1 ) = real( lrwmin )
440 iwork( 1 ) = liwmin
441*
442 RETURN
443*
444* End of CHEEVD_2STAGE
445*
446 END
subroutine xerbla(srname, info)
Definition cblat2.f:3285
subroutine cheevd_2stage(jobz, uplo, n, a, lda, w, work, lwork, rwork, lrwork, iwork, liwork, info)
CHEEVD_2STAGE computes the eigenvalues and, optionally, the left and/or right eigenvectors for HE mat...
subroutine chetrd_2stage(vect, uplo, n, a, lda, d, e, tau, hous2, lhous2, work, lwork, info)
CHETRD_2STAGE
subroutine clacpy(uplo, m, n, a, lda, b, ldb)
CLACPY copies all or part of one two-dimensional array to another.
Definition clacpy.f:101
subroutine clascl(type, kl, ku, cfrom, cto, m, n, a, lda, info)
CLASCL multiplies a general rectangular matrix by a real scalar defined as cto/cfrom.
Definition clascl.f:142
subroutine sscal(n, sa, sx, incx)
SSCAL
Definition sscal.f:79
subroutine cstedc(compz, n, d, e, z, ldz, work, lwork, rwork, lrwork, iwork, liwork, info)
CSTEDC
Definition cstedc.f:204
subroutine ssterf(n, d, e, info)
SSTERF
Definition ssterf.f:84
subroutine cunmtr(side, uplo, trans, m, n, a, lda, tau, c, ldc, work, lwork, info)
CUNMTR
Definition cunmtr.f:171