156 SUBROUTINE ssytri_3x( UPLO, N, A, LDA, E, IPIV, WORK, NB,
165 INTEGER INFO, LDA, N, NB
169 REAL A( LDA, * ), E( * ), WORK( N+NB+1, * )
176 parameter( one = 1.0e+0, zero = 0.0e+0 )
180 INTEGER CUT, I, ICOUNT, INVD, IP, K, NNB, J, U11
181 REAL AK, AKKP1, AKP1, D, T, U01_I_J, U01_IP1_J,
193 INTRINSIC abs, max, mod
200 upper = lsame( uplo,
'U' )
201 IF( .NOT.upper .AND. .NOT.lsame( uplo,
'L' ) )
THEN
203 ELSE IF( n.LT.0 )
THEN
205 ELSE IF( lda.LT.max( 1, n ) )
THEN
212 CALL xerbla(
'SSYTRI_3X', -info )
221 work( k, 1 ) = e( k )
231 IF( ipiv( info ).GT.0 .AND. a( info, info ).EQ.zero )
239 IF( ipiv( info ).GT.0 .AND. a( info, info ).EQ.zero )
265 CALL strtri( uplo,
'U', n, a, lda, info )
271 IF( ipiv( k ).GT.0 )
THEN
273 work( k, invd ) = one / a( k, k )
274 work( k, invd+1 ) = zero
279 akp1 = a( k+1, k+1 ) / t
280 akkp1 = work( k+1, 1 ) / t
281 d = t*( ak*akp1-one )
282 work( k, invd ) = akp1 / d
283 work( k+1, invd+1 ) = ak / d
284 work( k, invd+1 ) = -akkp1 / d
285 work( k+1, invd ) = work( k, invd+1 )
298 IF( cut.LE.nnb )
THEN
303 DO i = cut+1-nnb, cut
304 IF( ipiv( i ).LT.0 ) icount = icount + 1
307 IF( mod( icount, 2 ).EQ.1 ) nnb = nnb + 1
316 work( i, j ) = a( i, cut+j )
323 work( u11+i, i ) = one
325 work( u11+i, j ) = zero
328 work( u11+i, j ) = a( cut+i, cut+j )
336 IF( ipiv( i ).GT.0 )
THEN
338 work( i, j ) = work( i, invd ) * work( i, j )
342 u01_i_j = work( i, j )
343 u01_ip1_j = work( i+1, j )
344 work( i, j ) = work( i, invd ) * u01_i_j
345 $ + work( i, invd+1 ) * u01_ip1_j
346 work( i+1, j ) = work( i+1, invd ) * u01_i_j
347 $ + work( i+1, invd+1 ) * u01_ip1_j
357 DO WHILE ( i.LE.nnb )
358 IF( ipiv( cut+i ).GT.0 )
THEN
360 work( u11+i, j ) = work(cut+i,invd) * work(u11+i,j)
364 u11_i_j = work(u11+i,j)
365 u11_ip1_j = work(u11+i+1,j)
366 work( u11+i, j ) = work(cut+i,invd) * work(u11+i,j)
367 $ + work(cut+i,invd+1) * work(u11+i+1,j)
368 work( u11+i+1, j ) = work(cut+i+1,invd) * u11_i_j
369 $ + work(cut+i+1,invd+1) * u11_ip1_j
378 CALL strmm(
'L',
'U',
'T',
'U', nnb, nnb,
379 $ one, a( cut+1, cut+1 ), lda, work( u11+1, 1 ),
384 a( cut+i, cut+j ) = work( u11+i, j )
390 CALL sgemm(
'T',
'N', nnb, nnb, cut, one, a( 1, cut+1 ),
391 $ lda, work, n+nb+1, zero, work(u11+1,1), n+nb+1 )
398 a( cut+i, cut+j ) = a( cut+i, cut+j ) + work(u11+i,j)
404 CALL strmm(
'L', uplo,
'T',
'U', cut, nnb,
405 $ one, a, lda, work, n+nb+1 )
412 a( i, cut+j ) = work( i, j )
432 ip = abs( ipiv( i ) )
434 IF (i .LT. ip)
CALL ssyswapr( uplo, n, a, lda, i ,
436 IF (i .GT. ip)
CALL ssyswapr( uplo, n, a, lda, ip ,
447 CALL strtri( uplo,
'U', n, a, lda, info )
452 DO WHILE ( k .GE. 1 )
453 IF( ipiv( k ).GT.0 )
THEN
455 work( k, invd ) = one / a( k, k )
456 work( k, invd+1 ) = zero
460 ak = a( k-1, k-1 ) / t
462 akkp1 = work( k-1, 1 ) / t
463 d = t*( ak*akp1-one )
464 work( k-1, invd ) = akp1 / d
465 work( k, invd ) = ak / d
466 work( k, invd+1 ) = -akkp1 / d
467 work( k-1, invd+1 ) = work( k, invd+1 )
480 IF( (cut + nnb).GT.n )
THEN
485 DO i = cut + 1, cut+nnb
486 IF ( ipiv( i ).LT.0 ) icount = icount + 1
489 IF( mod( icount, 2 ).EQ.1 ) nnb = nnb + 1
496 work( i, j ) = a( cut+nnb+i, cut+j )
503 work( u11+i, i) = one
505 work( u11+i, j ) = zero
508 work( u11+i, j ) = a( cut+i, cut+j )
516 IF( ipiv( cut+nnb+i ).GT.0 )
THEN
518 work( i, j ) = work( cut+nnb+i, invd) * work( i, j)
523 u01_ip1_j = work(i-1,j)
524 work(i,j)=work(cut+nnb+i,invd)*u01_i_j+
525 $ work(cut+nnb+i,invd+1)*u01_ip1_j
526 work(i-1,j)=work(cut+nnb+i-1,invd+1)*u01_i_j+
527 $ work(cut+nnb+i-1,invd)*u01_ip1_j
538 IF( ipiv( cut+i ).GT.0 )
THEN
540 work( u11+i, j ) = work( cut+i, invd)*work(u11+i,j)
545 u11_i_j = work( u11+i, j )
546 u11_ip1_j = work( u11+i-1, j )
547 work( u11+i, j ) = work(cut+i,invd) * work(u11+i,j)
548 $ + work(cut+i,invd+1) * u11_ip1_j
549 work( u11+i-1, j ) = work(cut+i-1,invd+1) * u11_i_j
550 $ + work(cut+i-1,invd) * u11_ip1_j
559 CALL strmm(
'L', uplo,
'T',
'U', nnb, nnb, one,
560 $ a( cut+1, cut+1 ), lda, work( u11+1, 1 ),
566 a( cut+i, cut+j ) = work( u11+i, j )
570 IF( (cut+nnb).LT.n )
THEN
574 CALL sgemm(
'T',
'N', nnb, nnb, n-nnb-cut, one,
575 $ a( cut+nnb+1, cut+1 ), lda, work, n+nb+1,
576 $ zero, work( u11+1, 1 ), n+nb+1 )
583 a( cut+i, cut+j ) = a( cut+i, cut+j )+work(u11+i,j)
589 CALL strmm(
'L', uplo,
'T',
'U', n-nnb-cut, nnb, one,
590 $ a( cut+nnb+1, cut+nnb+1 ), lda, work,
597 a( cut+nnb+i, cut+j ) = work( i, j )
607 a( cut+i, cut+j ) = work( u11+i, j )
630 ip = abs( ipiv( i ) )
632 IF (i .LT. ip)
CALL ssyswapr( uplo, n, a, lda, i ,
634 IF (i .GT. ip)
CALL ssyswapr( uplo, n, a, lda, ip ,