LAPACK 3.12.1
LAPACK: Linear Algebra PACKage
Loading...
Searching...
No Matches
csytri_3x.f
Go to the documentation of this file.
1*> \brief \b CSYTRI_3X
2*
3* =========== DOCUMENTATION ===========
4*
5* Online html documentation available at
6* http://www.netlib.org/lapack/explore-html/
7*
8*> Download CSYTRI_3X + dependencies
9*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/csytri_3x.f">
10*> [TGZ]</a>
11*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/csytri_3x.f">
12*> [ZIP]</a>
13*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/csytri_3x.f">
14*> [TXT]</a>
15*
16* Definition:
17* ===========
18*
19* SUBROUTINE CSYTRI_3X( UPLO, N, A, LDA, E, IPIV, WORK, NB, INFO )
20*
21* .. Scalar Arguments ..
22* CHARACTER UPLO
23* INTEGER INFO, LDA, N, NB
24* ..
25* .. Array Arguments ..
26* INTEGER IPIV( * )
27* COMPLEX*16 A( LDA, * ), E( * ), WORK( N+NB+1, * )
28* ..
29*
30*
31*> \par Purpose:
32* =============
33*>
34*> \verbatim
35*> CSYTRI_3X computes the inverse of a complex symmetric indefinite
36*> matrix A using the factorization computed by CSYTRF_RK or CSYTRF_BK:
37*>
38*> A = P*U*D*(U**T)*(P**T) or A = P*L*D*(L**T)*(P**T),
39*>
40*> where U (or L) is unit upper (or lower) triangular matrix,
41*> U**T (or L**T) is the transpose of U (or L), P is a permutation
42*> matrix, P**T is the transpose of P, and D is symmetric and block
43*> diagonal with 1-by-1 and 2-by-2 diagonal blocks.
44*>
45*> This is the blocked version of the algorithm, calling Level 3 BLAS.
46*> \endverbatim
47*
48* Arguments:
49* ==========
50*
51*> \param[in] UPLO
52*> \verbatim
53*> UPLO is CHARACTER*1
54*> Specifies whether the details of the factorization are
55*> stored as an upper or lower triangular matrix.
56*> = 'U': Upper triangle of A is stored;
57*> = 'L': Lower triangle of A is stored.
58*> \endverbatim
59*>
60*> \param[in] N
61*> \verbatim
62*> N is INTEGER
63*> The order of the matrix A. N >= 0.
64*> \endverbatim
65*>
66*> \param[in,out] A
67*> \verbatim
68*> A is COMPLEX array, dimension (LDA,N)
69*> On entry, diagonal of the block diagonal matrix D and
70*> factors U or L as computed by CSYTRF_RK and CSYTRF_BK:
71*> a) ONLY diagonal elements of the symmetric block diagonal
72*> matrix D on the diagonal of A, i.e. D(k,k) = A(k,k);
73*> (superdiagonal (or subdiagonal) elements of D
74*> should be provided on entry in array E), and
75*> b) If UPLO = 'U': factor U in the superdiagonal part of A.
76*> If UPLO = 'L': factor L in the subdiagonal part of A.
77*>
78*> On exit, if INFO = 0, the symmetric inverse of the original
79*> matrix.
80*> If UPLO = 'U': the upper triangular part of the inverse
81*> is formed and the part of A below the diagonal is not
82*> referenced;
83*> If UPLO = 'L': the lower triangular part of the inverse
84*> is formed and the part of A above the diagonal is not
85*> referenced.
86*> \endverbatim
87*>
88*> \param[in] LDA
89*> \verbatim
90*> LDA is INTEGER
91*> The leading dimension of the array A. LDA >= max(1,N).
92*> \endverbatim
93*>
94*> \param[in] E
95*> \verbatim
96*> E is COMPLEX array, dimension (N)
97*> On entry, contains the superdiagonal (or subdiagonal)
98*> elements of the symmetric block diagonal matrix D
99*> with 1-by-1 or 2-by-2 diagonal blocks, where
100*> If UPLO = 'U': E(i) = D(i-1,i), i=2:N, E(1) not referenced;
101*> If UPLO = 'L': E(i) = D(i+1,i), i=1:N-1, E(N) not referenced.
102*>
103*> NOTE: For 1-by-1 diagonal block D(k), where
104*> 1 <= k <= N, the element E(k) is not referenced in both
105*> UPLO = 'U' or UPLO = 'L' cases.
106*> \endverbatim
107*>
108*> \param[in] IPIV
109*> \verbatim
110*> IPIV is INTEGER array, dimension (N)
111*> Details of the interchanges and the block structure of D
112*> as determined by CSYTRF_RK or CSYTRF_BK.
113*> \endverbatim
114*>
115*> \param[out] WORK
116*> \verbatim
117*> WORK is COMPLEX array, dimension (N+NB+1,NB+3).
118*> \endverbatim
119*>
120*> \param[in] NB
121*> \verbatim
122*> NB is INTEGER
123*> Block size.
124*> \endverbatim
125*>
126*> \param[out] INFO
127*> \verbatim
128*> INFO is INTEGER
129*> = 0: successful exit
130*> < 0: if INFO = -i, the i-th argument had an illegal value
131*> > 0: if INFO = i, D(i,i) = 0; the matrix is singular and its
132*> inverse could not be computed.
133*> \endverbatim
134*
135* Authors:
136* ========
137*
138*> \author Univ. of Tennessee
139*> \author Univ. of California Berkeley
140*> \author Univ. of Colorado Denver
141*> \author NAG Ltd.
142*
143*> \ingroup hetri_3x
144*
145*> \par Contributors:
146* ==================
147*> \verbatim
148*>
149*> June 2017, Igor Kozachenko,
150*> Computer Science Division,
151*> University of California, Berkeley
152*>
153*> \endverbatim
154*
155* =====================================================================
156 SUBROUTINE csytri_3x( UPLO, N, A, LDA, E, IPIV, WORK, NB,
157 $ INFO )
158*
159* -- LAPACK computational routine --
160* -- LAPACK is a software package provided by Univ. of Tennessee, --
161* -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
162*
163* .. Scalar Arguments ..
164 CHARACTER UPLO
165 INTEGER INFO, LDA, N, NB
166* ..
167* .. Array Arguments ..
168 INTEGER IPIV( * )
169 COMPLEX A( LDA, * ), E( * ), WORK( N+NB+1, * )
170* ..
171*
172* =====================================================================
173*
174* .. Parameters ..
175 COMPLEX CONE, CZERO
176 parameter( cone = ( 1.0e+0, 0.0e+0 ),
177 $ czero = ( 0.0e+0, 0.0e+0 ) )
178* ..
179* .. Local Scalars ..
180 LOGICAL UPPER
181 INTEGER CUT, I, ICOUNT, INVD, IP, K, NNB, J, U11
182 COMPLEX AK, AKKP1, AKP1, D, T, U01_I_J, U01_IP1_J,
183 $ u11_i_j, u11_ip1_j
184* ..
185* .. External Functions ..
186 LOGICAL LSAME
187 EXTERNAL lsame
188* ..
189* .. External Subroutines ..
190 EXTERNAL cgemm, csyswapr, ctrtri, ctrmm,
191 $ xerbla
192* ..
193* .. Intrinsic Functions ..
194 INTRINSIC abs, max, mod
195* ..
196* .. Executable Statements ..
197*
198* Test the input parameters.
199*
200 info = 0
201 upper = lsame( uplo, 'U' )
202 IF( .NOT.upper .AND. .NOT.lsame( uplo, 'L' ) ) THEN
203 info = -1
204 ELSE IF( n.LT.0 ) THEN
205 info = -2
206 ELSE IF( lda.LT.max( 1, n ) ) THEN
207 info = -4
208 END IF
209*
210* Quick return if possible
211*
212 IF( info.NE.0 ) THEN
213 CALL xerbla( 'CSYTRI_3X', -info )
214 RETURN
215 END IF
216 IF( n.EQ.0 )
217 $ RETURN
218*
219* Workspace got Non-diag elements of D
220*
221 DO k = 1, n
222 work( k, 1 ) = e( k )
223 END DO
224*
225* Check that the diagonal matrix D is nonsingular.
226*
227 IF( upper ) THEN
228*
229* Upper triangular storage: examine D from bottom to top
230*
231 DO info = n, 1, -1
232 IF( ipiv( info ).GT.0 .AND. a( info, info ).EQ.czero )
233 $ RETURN
234 END DO
235 ELSE
236*
237* Lower triangular storage: examine D from top to bottom.
238*
239 DO info = 1, n
240 IF( ipiv( info ).GT.0 .AND. a( info, info ).EQ.czero )
241 $ RETURN
242 END DO
243 END IF
244*
245 info = 0
246*
247* Splitting Workspace
248* U01 is a block ( N, NB+1 )
249* The first element of U01 is in WORK( 1, 1 )
250* U11 is a block ( NB+1, NB+1 )
251* The first element of U11 is in WORK( N+1, 1 )
252*
253 u11 = n
254*
255* INVD is a block ( N, 2 )
256* The first element of INVD is in WORK( 1, INVD )
257*
258 invd = nb + 2
259
260 IF( upper ) THEN
261*
262* Begin Upper
263*
264* invA = P * inv(U**T) * inv(D) * inv(U) * P**T.
265*
266 CALL ctrtri( uplo, 'U', n, a, lda, info )
267*
268* inv(D) and inv(D) * inv(U)
269*
270 k = 1
271 DO WHILE( k.LE.n )
272 IF( ipiv( k ).GT.0 ) THEN
273* 1 x 1 diagonal NNB
274 work( k, invd ) = cone / a( k, k )
275 work( k, invd+1 ) = czero
276 ELSE
277* 2 x 2 diagonal NNB
278 t = work( k+1, 1 )
279 ak = a( k, k ) / t
280 akp1 = a( k+1, k+1 ) / t
281 akkp1 = work( k+1, 1 ) / t
282 d = t*( ak*akp1-cone )
283 work( k, invd ) = akp1 / d
284 work( k+1, invd+1 ) = ak / d
285 work( k, invd+1 ) = -akkp1 / d
286 work( k+1, invd ) = work( k, invd+1 )
287 k = k + 1
288 END IF
289 k = k + 1
290 END DO
291*
292* inv(U**T) = (inv(U))**T
293*
294* inv(U**T) * inv(D) * inv(U)
295*
296 cut = n
297 DO WHILE( cut.GT.0 )
298 nnb = nb
299 IF( cut.LE.nnb ) THEN
300 nnb = cut
301 ELSE
302 icount = 0
303* count negative elements,
304 DO i = cut+1-nnb, cut
305 IF( ipiv( i ).LT.0 ) icount = icount + 1
306 END DO
307* need a even number for a clear cut
308 IF( mod( icount, 2 ).EQ.1 ) nnb = nnb + 1
309 END IF
310
311 cut = cut - nnb
312*
313* U01 Block
314*
315 DO i = 1, cut
316 DO j = 1, nnb
317 work( i, j ) = a( i, cut+j )
318 END DO
319 END DO
320*
321* U11 Block
322*
323 DO i = 1, nnb
324 work( u11+i, i ) = cone
325 DO j = 1, i-1
326 work( u11+i, j ) = czero
327 END DO
328 DO j = i+1, nnb
329 work( u11+i, j ) = a( cut+i, cut+j )
330 END DO
331 END DO
332*
333* invD * U01
334*
335 i = 1
336 DO WHILE( i.LE.cut )
337 IF( ipiv( i ).GT.0 ) THEN
338 DO j = 1, nnb
339 work( i, j ) = work( i, invd ) * work( i, j )
340 END DO
341 ELSE
342 DO j = 1, nnb
343 u01_i_j = work( i, j )
344 u01_ip1_j = work( i+1, j )
345 work( i, j ) = work( i, invd ) * u01_i_j
346 $ + work( i, invd+1 ) * u01_ip1_j
347 work( i+1, j ) = work( i+1, invd ) * u01_i_j
348 $ + work( i+1, invd+1 ) * u01_ip1_j
349 END DO
350 i = i + 1
351 END IF
352 i = i + 1
353 END DO
354*
355* invD1 * U11
356*
357 i = 1
358 DO WHILE ( i.LE.nnb )
359 IF( ipiv( cut+i ).GT.0 ) THEN
360 DO j = i, nnb
361 work( u11+i, j ) = work(cut+i,invd) * work(u11+i,j)
362 END DO
363 ELSE
364 DO j = i, nnb
365 u11_i_j = work(u11+i,j)
366 u11_ip1_j = work(u11+i+1,j)
367 work( u11+i, j ) = work(cut+i,invd) * work(u11+i,j)
368 $ + work(cut+i,invd+1) * work(u11+i+1,j)
369 work( u11+i+1, j ) = work(cut+i+1,invd) * u11_i_j
370 $ + work(cut+i+1,invd+1) * u11_ip1_j
371 END DO
372 i = i + 1
373 END IF
374 i = i + 1
375 END DO
376*
377* U11**T * invD1 * U11 -> U11
378*
379 CALL ctrmm( 'L', 'U', 'T', 'U', nnb, nnb,
380 $ cone, a( cut+1, cut+1 ), lda, work( u11+1, 1 ),
381 $ n+nb+1 )
382*
383 DO i = 1, nnb
384 DO j = i, nnb
385 a( cut+i, cut+j ) = work( u11+i, j )
386 END DO
387 END DO
388*
389* U01**T * invD * U01 -> A( CUT+I, CUT+J )
390*
391 CALL cgemm( 'T', 'N', nnb, nnb, cut, cone, a( 1, cut+1 ),
392 $ lda, work, n+nb+1, czero, work(u11+1,1),
393 $ n+nb+1 )
394
395*
396* U11 = U11**T * invD1 * U11 + U01**T * invD * U01
397*
398 DO i = 1, nnb
399 DO j = i, nnb
400 a( cut+i, cut+j ) = a( cut+i, cut+j ) + work(u11+i,j)
401 END DO
402 END DO
403*
404* U01 = U00**T * invD0 * U01
405*
406 CALL ctrmm( 'L', uplo, 'T', 'U', cut, nnb,
407 $ cone, a, lda, work, n+nb+1 )
408
409*
410* Update U01
411*
412 DO i = 1, cut
413 DO j = 1, nnb
414 a( i, cut+j ) = work( i, j )
415 END DO
416 END DO
417*
418* Next Block
419*
420 END DO
421*
422* Apply PERMUTATIONS P and P**T:
423* P * inv(U**T) * inv(D) * inv(U) * P**T.
424* Interchange rows and columns I and IPIV(I) in reverse order
425* from the formation order of IPIV vector for Upper case.
426*
427* ( We can use a loop over IPIV with increment 1,
428* since the ABS value of IPIV(I) represents the row (column)
429* index of the interchange with row (column) i in both 1x1
430* and 2x2 pivot cases, i.e. we don't need separate code branches
431* for 1x1 and 2x2 pivot cases )
432*
433 DO i = 1, n
434 ip = abs( ipiv( i ) )
435 IF( ip.NE.i ) THEN
436 IF (i .LT. ip) CALL csyswapr( uplo, n, a, lda, i ,
437 $ ip )
438 IF (i .GT. ip) CALL csyswapr( uplo, n, a, lda, ip ,
439 $ i )
440 END IF
441 END DO
442*
443 ELSE
444*
445* Begin Lower
446*
447* inv A = P * inv(L**T) * inv(D) * inv(L) * P**T.
448*
449 CALL ctrtri( uplo, 'U', n, a, lda, info )
450*
451* inv(D) and inv(D) * inv(L)
452*
453 k = n
454 DO WHILE ( k .GE. 1 )
455 IF( ipiv( k ).GT.0 ) THEN
456* 1 x 1 diagonal NNB
457 work( k, invd ) = cone / a( k, k )
458 work( k, invd+1 ) = czero
459 ELSE
460* 2 x 2 diagonal NNB
461 t = work( k-1, 1 )
462 ak = a( k-1, k-1 ) / t
463 akp1 = a( k, k ) / t
464 akkp1 = work( k-1, 1 ) / t
465 d = t*( ak*akp1-cone )
466 work( k-1, invd ) = akp1 / d
467 work( k, invd ) = ak / d
468 work( k, invd+1 ) = -akkp1 / d
469 work( k-1, invd+1 ) = work( k, invd+1 )
470 k = k - 1
471 END IF
472 k = k - 1
473 END DO
474*
475* inv(L**T) = (inv(L))**T
476*
477* inv(L**T) * inv(D) * inv(L)
478*
479 cut = 0
480 DO WHILE( cut.LT.n )
481 nnb = nb
482 IF( (cut + nnb).GT.n ) THEN
483 nnb = n - cut
484 ELSE
485 icount = 0
486* count negative elements,
487 DO i = cut + 1, cut+nnb
488 IF ( ipiv( i ).LT.0 ) icount = icount + 1
489 END DO
490* need a even number for a clear cut
491 IF( mod( icount, 2 ).EQ.1 ) nnb = nnb + 1
492 END IF
493*
494* L21 Block
495*
496 DO i = 1, n-cut-nnb
497 DO j = 1, nnb
498 work( i, j ) = a( cut+nnb+i, cut+j )
499 END DO
500 END DO
501*
502* L11 Block
503*
504 DO i = 1, nnb
505 work( u11+i, i) = cone
506 DO j = i+1, nnb
507 work( u11+i, j ) = czero
508 END DO
509 DO j = 1, i-1
510 work( u11+i, j ) = a( cut+i, cut+j )
511 END DO
512 END DO
513*
514* invD*L21
515*
516 i = n-cut-nnb
517 DO WHILE( i.GE.1 )
518 IF( ipiv( cut+nnb+i ).GT.0 ) THEN
519 DO j = 1, nnb
520 work( i, j ) = work( cut+nnb+i, invd) * work( i, j)
521 END DO
522 ELSE
523 DO j = 1, nnb
524 u01_i_j = work(i,j)
525 u01_ip1_j = work(i-1,j)
526 work(i,j)=work(cut+nnb+i,invd)*u01_i_j+
527 $ work(cut+nnb+i,invd+1)*u01_ip1_j
528 work(i-1,j)=work(cut+nnb+i-1,invd+1)*u01_i_j+
529 $ work(cut+nnb+i-1,invd)*u01_ip1_j
530 END DO
531 i = i - 1
532 END IF
533 i = i - 1
534 END DO
535*
536* invD1*L11
537*
538 i = nnb
539 DO WHILE( i.GE.1 )
540 IF( ipiv( cut+i ).GT.0 ) THEN
541 DO j = 1, nnb
542 work( u11+i, j ) = work( cut+i, invd)*work(u11+i,j)
543 END DO
544
545 ELSE
546 DO j = 1, nnb
547 u11_i_j = work( u11+i, j )
548 u11_ip1_j = work( u11+i-1, j )
549 work( u11+i, j ) = work(cut+i,invd) * work(u11+i,j)
550 $ + work(cut+i,invd+1) * u11_ip1_j
551 work( u11+i-1, j ) = work(cut+i-1,invd+1) * u11_i_j
552 $ + work(cut+i-1,invd) * u11_ip1_j
553 END DO
554 i = i - 1
555 END IF
556 i = i - 1
557 END DO
558*
559* L11**T * invD1 * L11 -> L11
560*
561 CALL ctrmm( 'L', uplo, 'T', 'U', nnb, nnb, cone,
562 $ a( cut+1, cut+1 ), lda, work( u11+1, 1 ),
563 $ n+nb+1 )
564
565*
566 DO i = 1, nnb
567 DO j = 1, i
568 a( cut+i, cut+j ) = work( u11+i, j )
569 END DO
570 END DO
571*
572 IF( (cut+nnb).LT.n ) THEN
573*
574* L21**T * invD2*L21 -> A( CUT+I, CUT+J )
575*
576 CALL cgemm( 'T', 'N', nnb, nnb, n-nnb-cut, cone,
577 $ a( cut+nnb+1, cut+1 ), lda, work, n+nb+1,
578 $ czero, work( u11+1, 1 ), n+nb+1 )
579
580*
581* L11 = L11**T * invD1 * L11 + U01**T * invD * U01
582*
583 DO i = 1, nnb
584 DO j = 1, i
585 a( cut+i, cut+j ) = a( cut+i, cut+j )+work(u11+i,j)
586 END DO
587 END DO
588*
589* L01 = L22**T * invD2 * L21
590*
591 CALL ctrmm( 'L', uplo, 'T', 'U', n-nnb-cut, nnb, cone,
592 $ a( cut+nnb+1, cut+nnb+1 ), lda, work,
593 $ n+nb+1 )
594*
595* Update L21
596*
597 DO i = 1, n-cut-nnb
598 DO j = 1, nnb
599 a( cut+nnb+i, cut+j ) = work( i, j )
600 END DO
601 END DO
602*
603 ELSE
604*
605* L11 = L11**T * invD1 * L11
606*
607 DO i = 1, nnb
608 DO j = 1, i
609 a( cut+i, cut+j ) = work( u11+i, j )
610 END DO
611 END DO
612 END IF
613*
614* Next Block
615*
616 cut = cut + nnb
617*
618 END DO
619*
620* Apply PERMUTATIONS P and P**T:
621* P * inv(L**T) * inv(D) * inv(L) * P**T.
622* Interchange rows and columns I and IPIV(I) in reverse order
623* from the formation order of IPIV vector for Lower case.
624*
625* ( We can use a loop over IPIV with increment -1,
626* since the ABS value of IPIV(I) represents the row (column)
627* index of the interchange with row (column) i in both 1x1
628* and 2x2 pivot cases, i.e. we don't need separate code branches
629* for 1x1 and 2x2 pivot cases )
630*
631 DO i = n, 1, -1
632 ip = abs( ipiv( i ) )
633 IF( ip.NE.i ) THEN
634 IF (i .LT. ip) CALL csyswapr( uplo, n, a, lda, i ,
635 $ ip )
636 IF (i .GT. ip) CALL csyswapr( uplo, n, a, lda, ip ,
637 $ i )
638 END IF
639 END DO
640*
641 END IF
642*
643 RETURN
644*
645* End of CSYTRI_3X
646*
647 END
648
subroutine xerbla(srname, info)
Definition cblat2.f:3285
subroutine cgemm(transa, transb, m, n, k, alpha, a, lda, b, ldb, beta, c, ldc)
CGEMM
Definition cgemm.f:188
subroutine csyswapr(uplo, n, a, lda, i1, i2)
CSYSWAPR
Definition csyswapr.f:98
subroutine csytri_3x(uplo, n, a, lda, e, ipiv, work, nb, info)
CSYTRI_3X
Definition csytri_3x.f:158
subroutine ctrmm(side, uplo, transa, diag, m, n, alpha, a, lda, b, ldb)
CTRMM
Definition ctrmm.f:177
subroutine ctrtri(uplo, diag, n, a, lda, info)
CTRTRI
Definition ctrtri.f:107