version 1.13, 2014/01/27 09:28:18
|
version 1.14, 2015/11/26 11:44:17
|
Line 1
|
Line 1
|
*> \brief \b DGSVJ0 pre-processor for the routine sgesvj. |
*> \brief \b DGSVJ0 pre-processor for the routine dgesvj. |
* |
* |
* =========== DOCUMENTATION =========== |
* =========== DOCUMENTATION =========== |
* |
* |
Line 193
|
Line 193
|
*> \author Univ. of Colorado Denver |
*> \author Univ. of Colorado Denver |
*> \author NAG Ltd. |
*> \author NAG Ltd. |
* |
* |
*> \date September 2012 |
*> \date November 2015 |
* |
* |
*> \ingroup doubleOTHERcomputational |
*> \ingroup doubleOTHERcomputational |
* |
* |
Line 218
|
Line 218
|
SUBROUTINE DGSVJ0( JOBV, M, N, A, LDA, D, SVA, MV, V, LDV, EPS, |
SUBROUTINE DGSVJ0( JOBV, M, N, A, LDA, D, SVA, MV, V, LDV, EPS, |
$ SFMIN, TOL, NSWEEP, WORK, LWORK, INFO ) |
$ SFMIN, TOL, NSWEEP, WORK, LWORK, INFO ) |
* |
* |
* -- LAPACK computational routine (version 3.4.2) -- |
* -- LAPACK computational routine (version 3.6.0) -- |
* -- LAPACK is a software package provided by Univ. of Tennessee, -- |
* -- LAPACK is a software package provided by Univ. of Tennessee, -- |
* -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..-- |
* -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..-- |
* September 2012 |
* November 2015 |
* |
* |
* .. Scalar Arguments .. |
* .. Scalar Arguments .. |
INTEGER INFO, LDA, LDV, LWORK, M, MV, N, NSWEEP |
INTEGER INFO, LDA, LDV, LWORK, M, MV, N, NSWEEP |
Line 253
|
Line 253
|
DOUBLE PRECISION FASTR( 5 ) |
DOUBLE PRECISION FASTR( 5 ) |
* .. |
* .. |
* .. Intrinsic Functions .. |
* .. Intrinsic Functions .. |
INTRINSIC DABS, DMAX1, DBLE, MIN0, DSIGN, DSQRT |
INTRINSIC DABS, MAX, DBLE, MIN, DSIGN, DSQRT |
* .. |
* .. |
* .. External Functions .. |
* .. External Functions .. |
DOUBLE PRECISION DDOT, DNRM2 |
DOUBLE PRECISION DDOT, DNRM2 |
Line 329
|
Line 329
|
* Jacobi SVD algorithm DGESVJ. For sweeps i=1:SWBAND the procedure |
* Jacobi SVD algorithm DGESVJ. For sweeps i=1:SWBAND the procedure |
* ...... |
* ...... |
|
|
KBL = MIN0( 8, N ) |
KBL = MIN( 8, N ) |
*[TP] KBL is a tuning parameter that defines the tile size in the |
*[TP] KBL is a tuning parameter that defines the tile size in the |
* tiling of the p-q loops of pivot pairs. In general, an optimal |
* tiling of the p-q loops of pivot pairs. In general, an optimal |
* value of KBL depends on the matrix dimensions and on the |
* value of KBL depends on the matrix dimensions and on the |
Line 341
|
Line 341
|
BLSKIP = ( KBL**2 ) + 1 |
BLSKIP = ( KBL**2 ) + 1 |
*[TP] BLSKIP is a tuning parameter that depends on SWBAND and KBL. |
*[TP] BLSKIP is a tuning parameter that depends on SWBAND and KBL. |
|
|
ROWSKIP = MIN0( 5, KBL ) |
ROWSKIP = MIN( 5, KBL ) |
*[TP] ROWSKIP is a tuning parameter. |
*[TP] ROWSKIP is a tuning parameter. |
|
|
LKAHEAD = 1 |
LKAHEAD = 1 |
Line 363
|
Line 363
|
|
|
igl = ( ibr-1 )*KBL + 1 |
igl = ( ibr-1 )*KBL + 1 |
* |
* |
DO 1002 ir1 = 0, MIN0( LKAHEAD, NBL-ibr ) |
DO 1002 ir1 = 0, MIN( LKAHEAD, NBL-ibr ) |
* |
* |
igl = igl + ir1*KBL |
igl = igl + ir1*KBL |
* |
* |
DO 2001 p = igl, MIN0( igl+KBL-1, N-1 ) |
DO 2001 p = igl, MIN( igl+KBL-1, N-1 ) |
|
|
* .. de Rijk's pivoting |
* .. de Rijk's pivoting |
q = IDAMAX( N-p+1, SVA( p ), 1 ) + p - 1 |
q = IDAMAX( N-p+1, SVA( p ), 1 ) + p - 1 |
Line 416
|
Line 416
|
* |
* |
PSKIPPED = 0 |
PSKIPPED = 0 |
* |
* |
DO 2002 q = p + 1, MIN0( igl+KBL-1, N ) |
DO 2002 q = p + 1, MIN( igl+KBL-1, N ) |
* |
* |
AAQQ = SVA( q ) |
AAQQ = SVA( q ) |
|
|
Line 451
|
Line 451
|
END IF |
END IF |
END IF |
END IF |
* |
* |
MXAAPQ = DMAX1( MXAAPQ, DABS( AAPQ ) ) |
MXAAPQ = MAX( MXAAPQ, DABS( AAPQ ) ) |
* |
* |
* TO rotate or NOT to rotate, THAT is the question ... |
* TO rotate or NOT to rotate, THAT is the question ... |
* |
* |
Line 483
|
Line 483
|
$ V( 1, p ), 1, |
$ V( 1, p ), 1, |
$ V( 1, q ), 1, |
$ V( 1, q ), 1, |
$ FASTR ) |
$ FASTR ) |
SVA( q ) = AAQQ*DSQRT( DMAX1( ZERO, |
SVA( q ) = AAQQ*DSQRT( MAX( ZERO, |
$ ONE+T*APOAQ*AAPQ ) ) |
$ ONE+T*APOAQ*AAPQ ) ) |
AAPP = AAPP*DSQRT( DMAX1( ZERO, |
AAPP = AAPP*DSQRT( MAX( ZERO, |
$ ONE-T*AQOAP*AAPQ ) ) |
$ ONE-T*AQOAP*AAPQ ) ) |
MXSINJ = DMAX1( MXSINJ, DABS( T ) ) |
MXSINJ = MAX( MXSINJ, DABS( T ) ) |
* |
* |
ELSE |
ELSE |
* |
* |
Line 499
|
Line 499
|
CS = DSQRT( ONE / ( ONE+T*T ) ) |
CS = DSQRT( ONE / ( ONE+T*T ) ) |
SN = T*CS |
SN = T*CS |
* |
* |
MXSINJ = DMAX1( MXSINJ, DABS( SN ) ) |
MXSINJ = MAX( MXSINJ, DABS( SN ) ) |
SVA( q ) = AAQQ*DSQRT( DMAX1( ZERO, |
SVA( q ) = AAQQ*DSQRT( MAX( ZERO, |
$ ONE+T*APOAQ*AAPQ ) ) |
$ ONE+T*APOAQ*AAPQ ) ) |
AAPP = AAPP*DSQRT( DMAX1( ZERO, |
AAPP = AAPP*DSQRT( MAX( ZERO, |
$ ONE-T*AQOAP*AAPQ ) ) |
$ ONE-T*AQOAP*AAPQ ) ) |
* |
* |
APOAQ = D( p ) / D( q ) |
APOAQ = D( p ) / D( q ) |
Line 613
|
Line 613
|
$ A( 1, q ), 1 ) |
$ A( 1, q ), 1 ) |
CALL DLASCL( 'G', 0, 0, ONE, AAQQ, M, |
CALL DLASCL( 'G', 0, 0, ONE, AAQQ, M, |
$ 1, A( 1, q ), LDA, IERR ) |
$ 1, A( 1, q ), LDA, IERR ) |
SVA( q ) = AAQQ*DSQRT( DMAX1( ZERO, |
SVA( q ) = AAQQ*DSQRT( MAX( ZERO, |
$ ONE-AAPQ*AAPQ ) ) |
$ ONE-AAPQ*AAPQ ) ) |
MXSINJ = DMAX1( MXSINJ, SFMIN ) |
MXSINJ = MAX( MXSINJ, SFMIN ) |
END IF |
END IF |
* END IF ROTOK THEN ... ELSE |
* END IF ROTOK THEN ... ELSE |
* |
* |
Line 679
|
Line 679
|
ELSE |
ELSE |
SVA( p ) = AAPP |
SVA( p ) = AAPP |
IF( ( ir1.EQ.0 ) .AND. ( AAPP.EQ.ZERO ) ) |
IF( ( ir1.EQ.0 ) .AND. ( AAPP.EQ.ZERO ) ) |
$ NOTROT = NOTROT + MIN0( igl+KBL-1, N ) - p |
$ NOTROT = NOTROT + MIN( igl+KBL-1, N ) - p |
END IF |
END IF |
* |
* |
2001 CONTINUE |
2001 CONTINUE |
Line 700
|
Line 700
|
* doing the block at ( ibr, jbc ) |
* doing the block at ( ibr, jbc ) |
* |
* |
IJBLSK = 0 |
IJBLSK = 0 |
DO 2100 p = igl, MIN0( igl+KBL-1, N ) |
DO 2100 p = igl, MIN( igl+KBL-1, N ) |
* |
* |
AAPP = SVA( p ) |
AAPP = SVA( p ) |
* |
* |
Line 708
|
Line 708
|
* |
* |
PSKIPPED = 0 |
PSKIPPED = 0 |
* |
* |
DO 2200 q = jgl, MIN0( jgl+KBL-1, N ) |
DO 2200 q = jgl, MIN( jgl+KBL-1, N ) |
* |
* |
AAQQ = SVA( q ) |
AAQQ = SVA( q ) |
* |
* |
Line 755
|
Line 755
|
END IF |
END IF |
END IF |
END IF |
* |
* |
MXAAPQ = DMAX1( MXAAPQ, DABS( AAPQ ) ) |
MXAAPQ = MAX( MXAAPQ, DABS( AAPQ ) ) |
* |
* |
* TO rotate or NOT to rotate, THAT is the question ... |
* TO rotate or NOT to rotate, THAT is the question ... |
* |
* |
Line 782
|
Line 782
|
$ V( 1, p ), 1, |
$ V( 1, p ), 1, |
$ V( 1, q ), 1, |
$ V( 1, q ), 1, |
$ FASTR ) |
$ FASTR ) |
SVA( q ) = AAQQ*DSQRT( DMAX1( ZERO, |
SVA( q ) = AAQQ*DSQRT( MAX( ZERO, |
$ ONE+T*APOAQ*AAPQ ) ) |
$ ONE+T*APOAQ*AAPQ ) ) |
AAPP = AAPP*DSQRT( DMAX1( ZERO, |
AAPP = AAPP*DSQRT( MAX( ZERO, |
$ ONE-T*AQOAP*AAPQ ) ) |
$ ONE-T*AQOAP*AAPQ ) ) |
MXSINJ = DMAX1( MXSINJ, DABS( T ) ) |
MXSINJ = MAX( MXSINJ, DABS( T ) ) |
ELSE |
ELSE |
* |
* |
* .. choose correct signum for THETA and rotate |
* .. choose correct signum for THETA and rotate |
Line 797
|
Line 797
|
$ DSQRT( ONE+THETA*THETA ) ) |
$ DSQRT( ONE+THETA*THETA ) ) |
CS = DSQRT( ONE / ( ONE+T*T ) ) |
CS = DSQRT( ONE / ( ONE+T*T ) ) |
SN = T*CS |
SN = T*CS |
MXSINJ = DMAX1( MXSINJ, DABS( SN ) ) |
MXSINJ = MAX( MXSINJ, DABS( SN ) ) |
SVA( q ) = AAQQ*DSQRT( DMAX1( ZERO, |
SVA( q ) = AAQQ*DSQRT( MAX( ZERO, |
$ ONE+T*APOAQ*AAPQ ) ) |
$ ONE+T*APOAQ*AAPQ ) ) |
AAPP = AAPP*DSQRT( DMAX1( ZERO, |
AAPP = AAPP*DSQRT( MAX( ZERO, |
$ ONE-T*AQOAP*AAPQ ) ) |
$ ONE-T*AQOAP*AAPQ ) ) |
* |
* |
APOAQ = D( p ) / D( q ) |
APOAQ = D( p ) / D( q ) |
Line 915
|
Line 915
|
CALL DLASCL( 'G', 0, 0, ONE, AAQQ, |
CALL DLASCL( 'G', 0, 0, ONE, AAQQ, |
$ M, 1, A( 1, q ), LDA, |
$ M, 1, A( 1, q ), LDA, |
$ IERR ) |
$ IERR ) |
SVA( q ) = AAQQ*DSQRT( DMAX1( ZERO, |
SVA( q ) = AAQQ*DSQRT( MAX( ZERO, |
$ ONE-AAPQ*AAPQ ) ) |
$ ONE-AAPQ*AAPQ ) ) |
MXSINJ = DMAX1( MXSINJ, SFMIN ) |
MXSINJ = MAX( MXSINJ, SFMIN ) |
ELSE |
ELSE |
CALL DCOPY( M, A( 1, q ), 1, WORK, |
CALL DCOPY( M, A( 1, q ), 1, WORK, |
$ 1 ) |
$ 1 ) |
Line 932
|
Line 932
|
CALL DLASCL( 'G', 0, 0, ONE, AAPP, |
CALL DLASCL( 'G', 0, 0, ONE, AAPP, |
$ M, 1, A( 1, p ), LDA, |
$ M, 1, A( 1, p ), LDA, |
$ IERR ) |
$ IERR ) |
SVA( p ) = AAPP*DSQRT( DMAX1( ZERO, |
SVA( p ) = AAPP*DSQRT( MAX( ZERO, |
$ ONE-AAPQ*AAPQ ) ) |
$ ONE-AAPQ*AAPQ ) ) |
MXSINJ = DMAX1( MXSINJ, SFMIN ) |
MXSINJ = MAX( MXSINJ, SFMIN ) |
END IF |
END IF |
END IF |
END IF |
* END IF ROTOK THEN ... ELSE |
* END IF ROTOK THEN ... ELSE |
Line 1002
|
Line 1002
|
* |
* |
ELSE |
ELSE |
IF( AAPP.EQ.ZERO )NOTROT = NOTROT + |
IF( AAPP.EQ.ZERO )NOTROT = NOTROT + |
$ MIN0( jgl+KBL-1, N ) - jgl + 1 |
$ MIN( jgl+KBL-1, N ) - jgl + 1 |
IF( AAPP.LT.ZERO )NOTROT = 0 |
IF( AAPP.LT.ZERO )NOTROT = 0 |
END IF |
END IF |
|
|
Line 1012
|
Line 1012
|
* end of the jbc-loop |
* end of the jbc-loop |
2011 CONTINUE |
2011 CONTINUE |
*2011 bailed out of the jbc-loop |
*2011 bailed out of the jbc-loop |
DO 2012 p = igl, MIN0( igl+KBL-1, N ) |
DO 2012 p = igl, MIN( igl+KBL-1, N ) |
SVA( p ) = DABS( SVA( p ) ) |
SVA( p ) = DABS( SVA( p ) ) |
2012 CONTINUE |
2012 CONTINUE |
* |
* |