version 1.11, 2012/08/22 09:48:19
|
version 1.12, 2012/12/14 12:30:24
|
Line 1
|
Line 1
|
*> \brief \b DLARFB |
*> \brief \b DLARFB applies a block reflector or its transpose to a general rectangular matrix. |
* |
* |
* =========== DOCUMENTATION =========== |
* =========== DOCUMENTATION =========== |
* |
* |
Line 159
|
Line 159
|
*> \author Univ. of Colorado Denver |
*> \author Univ. of Colorado Denver |
*> \author NAG Ltd. |
*> \author NAG Ltd. |
* |
* |
*> \date November 2011 |
*> \date September 2012 |
* |
* |
*> \ingroup doubleOTHERauxiliary |
*> \ingroup doubleOTHERauxiliary |
* |
* |
Line 195
|
Line 195
|
SUBROUTINE DLARFB( SIDE, TRANS, DIRECT, STOREV, M, N, K, V, LDV, |
SUBROUTINE DLARFB( SIDE, TRANS, DIRECT, STOREV, M, N, K, V, LDV, |
$ T, LDT, C, LDC, WORK, LDWORK ) |
$ T, LDT, C, LDC, WORK, LDWORK ) |
* |
* |
* -- LAPACK auxiliary routine (version 3.4.0) -- |
* -- LAPACK auxiliary routine (version 3.4.2) -- |
* -- LAPACK is a software package provided by Univ. of Tennessee, -- |
* -- LAPACK is a software package provided by Univ. of Tennessee, -- |
* -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..-- |
* -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..-- |
* November 2011 |
* September 2012 |
* |
* |
* .. Scalar Arguments .. |
* .. Scalar Arguments .. |
CHARACTER DIRECT, SIDE, STOREV, TRANS |
CHARACTER DIRECT, SIDE, STOREV, TRANS |
Line 217
|
Line 217
|
* .. |
* .. |
* .. Local Scalars .. |
* .. Local Scalars .. |
CHARACTER TRANST |
CHARACTER TRANST |
INTEGER I, J, LASTV, LASTC |
INTEGER I, J, LASTV, LASTC, lastv2 |
* .. |
* .. |
* .. External Functions .. |
* .. External Functions .. |
LOGICAL LSAME |
LOGICAL LSAME |
Line 379
|
Line 379
|
* Form H * C or H**T * C where C = ( C1 ) |
* Form H * C or H**T * C where C = ( C1 ) |
* ( C2 ) |
* ( C2 ) |
* |
* |
LASTV = MAX( K, ILADLR( M, K, V, LDV ) ) |
LASTC = ILADLC( M, N, C, LDC ) |
LASTC = ILADLC( LASTV, N, C, LDC ) |
|
* |
* |
* W := C**T * V = (C1**T * V1 + C2**T * V2) (stored in WORK) |
* W := C**T * V = (C1**T * V1 + C2**T * V2) (stored in WORK) |
* |
* |
* W := C2**T |
* W := C2**T |
* |
* |
DO 70 J = 1, K |
DO 70 J = 1, K |
CALL DCOPY( LASTC, C( LASTV-K+J, 1 ), LDC, |
CALL DCOPY( LASTC, C( M-K+J, 1 ), LDC, |
$ WORK( 1, J ), 1 ) |
$ WORK( 1, J ), 1 ) |
70 CONTINUE |
70 CONTINUE |
* |
* |
* W := W * V2 |
* W := W * V2 |
* |
* |
CALL DTRMM( 'Right', 'Upper', 'No transpose', 'Unit', |
CALL DTRMM( 'Right', 'Upper', 'No transpose', 'Unit', |
$ LASTC, K, ONE, V( LASTV-K+1, 1 ), LDV, |
$ LASTC, K, ONE, V( M-K+1, 1 ), LDV, |
$ WORK, LDWORK ) |
$ WORK, LDWORK ) |
IF( LASTV.GT.K ) THEN |
IF( M.GT.K ) THEN |
* |
* |
* W := W + C1**T*V1 |
* W := W + C1**T*V1 |
* |
* |
CALL DGEMM( 'Transpose', 'No transpose', |
CALL DGEMM( 'Transpose', 'No transpose', |
$ LASTC, K, LASTV-K, ONE, C, LDC, V, LDV, |
$ LASTC, K, M-K, ONE, C, LDC, V, LDV, |
$ ONE, WORK, LDWORK ) |
$ ONE, WORK, LDWORK ) |
END IF |
END IF |
* |
* |
Line 412
|
Line 411
|
* |
* |
* C := C - V * W**T |
* C := C - V * W**T |
* |
* |
IF( LASTV.GT.K ) THEN |
IF( M.GT.K ) THEN |
* |
* |
* C1 := C1 - V1 * W**T |
* C1 := C1 - V1 * W**T |
* |
* |
CALL DGEMM( 'No transpose', 'Transpose', |
CALL DGEMM( 'No transpose', 'Transpose', |
$ LASTV-K, LASTC, K, -ONE, V, LDV, WORK, LDWORK, |
$ M-K, LASTC, K, -ONE, V, LDV, WORK, LDWORK, |
$ ONE, C, LDC ) |
$ ONE, C, LDC ) |
END IF |
END IF |
* |
* |
* W := W * V2**T |
* W := W * V2**T |
* |
* |
CALL DTRMM( 'Right', 'Upper', 'Transpose', 'Unit', |
CALL DTRMM( 'Right', 'Upper', 'Transpose', 'Unit', |
$ LASTC, K, ONE, V( LASTV-K+1, 1 ), LDV, |
$ LASTC, K, ONE, V( M-K+1, 1 ), LDV, |
$ WORK, LDWORK ) |
$ WORK, LDWORK ) |
* |
* |
* C2 := C2 - W**T |
* C2 := C2 - W**T |
* |
* |
DO 90 J = 1, K |
DO 90 J = 1, K |
DO 80 I = 1, LASTC |
DO 80 I = 1, LASTC |
C( LASTV-K+J, I ) = C( LASTV-K+J, I ) - WORK(I, J) |
C( M-K+J, I ) = C( M-K+J, I ) - WORK(I, J) |
80 CONTINUE |
80 CONTINUE |
90 CONTINUE |
90 CONTINUE |
* |
* |
Line 439
|
Line 438
|
* |
* |
* Form C * H or C * H**T where C = ( C1 C2 ) |
* Form C * H or C * H**T where C = ( C1 C2 ) |
* |
* |
LASTV = MAX( K, ILADLR( N, K, V, LDV ) ) |
LASTC = ILADLR( M, N, C, LDC ) |
LASTC = ILADLR( M, LASTV, C, LDC ) |
|
* |
* |
* W := C * V = (C1*V1 + C2*V2) (stored in WORK) |
* W := C * V = (C1*V1 + C2*V2) (stored in WORK) |
* |
* |
Line 453
|
Line 451
|
* W := W * V2 |
* W := W * V2 |
* |
* |
CALL DTRMM( 'Right', 'Upper', 'No transpose', 'Unit', |
CALL DTRMM( 'Right', 'Upper', 'No transpose', 'Unit', |
$ LASTC, K, ONE, V( LASTV-K+1, 1 ), LDV, |
$ LASTC, K, ONE, V( N-K+1, 1 ), LDV, |
$ WORK, LDWORK ) |
$ WORK, LDWORK ) |
IF( LASTV.GT.K ) THEN |
IF( N.GT.K ) THEN |
* |
* |
* W := W + C1 * V1 |
* W := W + C1 * V1 |
* |
* |
CALL DGEMM( 'No transpose', 'No transpose', |
CALL DGEMM( 'No transpose', 'No transpose', |
$ LASTC, K, LASTV-K, ONE, C, LDC, V, LDV, |
$ LASTC, K, N-K, ONE, C, LDC, V, LDV, |
$ ONE, WORK, LDWORK ) |
$ ONE, WORK, LDWORK ) |
END IF |
END IF |
* |
* |
Line 471
|
Line 469
|
* |
* |
* C := C - W * V**T |
* C := C - W * V**T |
* |
* |
IF( LASTV.GT.K ) THEN |
IF( N.GT.K ) THEN |
* |
* |
* C1 := C1 - W * V1**T |
* C1 := C1 - W * V1**T |
* |
* |
CALL DGEMM( 'No transpose', 'Transpose', |
CALL DGEMM( 'No transpose', 'Transpose', |
$ LASTC, LASTV-K, K, -ONE, WORK, LDWORK, V, LDV, |
$ LASTC, N-K, K, -ONE, WORK, LDWORK, V, LDV, |
$ ONE, C, LDC ) |
$ ONE, C, LDC ) |
END IF |
END IF |
* |
* |
* W := W * V2**T |
* W := W * V2**T |
* |
* |
CALL DTRMM( 'Right', 'Upper', 'Transpose', 'Unit', |
CALL DTRMM( 'Right', 'Upper', 'Transpose', 'Unit', |
$ LASTC, K, ONE, V( LASTV-K+1, 1 ), LDV, |
$ LASTC, K, ONE, V( N-K+1, 1 ), LDV, |
$ WORK, LDWORK ) |
$ WORK, LDWORK ) |
* |
* |
* C2 := C2 - W |
* C2 := C2 - W |
* |
* |
DO 120 J = 1, K |
DO 120 J = 1, K |
DO 110 I = 1, LASTC |
DO 110 I = 1, LASTC |
C( I, LASTV-K+J ) = C( I, LASTV-K+J ) - WORK(I, J) |
C( I, N-K+J ) = C( I, N-K+J ) - WORK(I, J) |
110 CONTINUE |
110 CONTINUE |
120 CONTINUE |
120 CONTINUE |
END IF |
END IF |
Line 634
|
Line 632
|
* Form H * C or H**T * C where C = ( C1 ) |
* Form H * C or H**T * C where C = ( C1 ) |
* ( C2 ) |
* ( C2 ) |
* |
* |
LASTV = MAX( K, ILADLC( K, M, V, LDV ) ) |
LASTC = ILADLC( M, N, C, LDC ) |
LASTC = ILADLC( LASTV, N, C, LDC ) |
|
* |
* |
* W := C**T * V**T = (C1**T * V1**T + C2**T * V2**T) (stored in WORK) |
* W := C**T * V**T = (C1**T * V1**T + C2**T * V2**T) (stored in WORK) |
* |
* |
* W := C2**T |
* W := C2**T |
* |
* |
DO 190 J = 1, K |
DO 190 J = 1, K |
CALL DCOPY( LASTC, C( LASTV-K+J, 1 ), LDC, |
CALL DCOPY( LASTC, C( M-K+J, 1 ), LDC, |
$ WORK( 1, J ), 1 ) |
$ WORK( 1, J ), 1 ) |
190 CONTINUE |
190 CONTINUE |
* |
* |
* W := W * V2**T |
* W := W * V2**T |
* |
* |
CALL DTRMM( 'Right', 'Lower', 'Transpose', 'Unit', |
CALL DTRMM( 'Right', 'Lower', 'Transpose', 'Unit', |
$ LASTC, K, ONE, V( 1, LASTV-K+1 ), LDV, |
$ LASTC, K, ONE, V( 1, M-K+1 ), LDV, |
$ WORK, LDWORK ) |
$ WORK, LDWORK ) |
IF( LASTV.GT.K ) THEN |
IF( M.GT.K ) THEN |
* |
* |
* W := W + C1**T * V1**T |
* W := W + C1**T * V1**T |
* |
* |
CALL DGEMM( 'Transpose', 'Transpose', |
CALL DGEMM( 'Transpose', 'Transpose', |
$ LASTC, K, LASTV-K, ONE, C, LDC, V, LDV, |
$ LASTC, K, M-K, ONE, C, LDC, V, LDV, |
$ ONE, WORK, LDWORK ) |
$ ONE, WORK, LDWORK ) |
END IF |
END IF |
* |
* |
Line 667
|
Line 664
|
* |
* |
* C := C - V**T * W**T |
* C := C - V**T * W**T |
* |
* |
IF( LASTV.GT.K ) THEN |
IF( M.GT.K ) THEN |
* |
* |
* C1 := C1 - V1**T * W**T |
* C1 := C1 - V1**T * W**T |
* |
* |
CALL DGEMM( 'Transpose', 'Transpose', |
CALL DGEMM( 'Transpose', 'Transpose', |
$ LASTV-K, LASTC, K, -ONE, V, LDV, WORK, LDWORK, |
$ M-K, LASTC, K, -ONE, V, LDV, WORK, LDWORK, |
$ ONE, C, LDC ) |
$ ONE, C, LDC ) |
END IF |
END IF |
* |
* |
* W := W * V2 |
* W := W * V2 |
* |
* |
CALL DTRMM( 'Right', 'Lower', 'No transpose', 'Unit', |
CALL DTRMM( 'Right', 'Lower', 'No transpose', 'Unit', |
$ LASTC, K, ONE, V( 1, LASTV-K+1 ), LDV, |
$ LASTC, K, ONE, V( 1, M-K+1 ), LDV, |
$ WORK, LDWORK ) |
$ WORK, LDWORK ) |
* |
* |
* C2 := C2 - W**T |
* C2 := C2 - W**T |
* |
* |
DO 210 J = 1, K |
DO 210 J = 1, K |
DO 200 I = 1, LASTC |
DO 200 I = 1, LASTC |
C( LASTV-K+J, I ) = C( LASTV-K+J, I ) - WORK(I, J) |
C( M-K+J, I ) = C( M-K+J, I ) - WORK(I, J) |
200 CONTINUE |
200 CONTINUE |
210 CONTINUE |
210 CONTINUE |
* |
* |
Line 694
|
Line 691
|
* |
* |
* Form C * H or C * H**T where C = ( C1 C2 ) |
* Form C * H or C * H**T where C = ( C1 C2 ) |
* |
* |
LASTV = MAX( K, ILADLC( K, N, V, LDV ) ) |
LASTC = ILADLR( M, N, C, LDC ) |
LASTC = ILADLR( M, LASTV, C, LDC ) |
|
* |
* |
* W := C * V**T = (C1*V1**T + C2*V2**T) (stored in WORK) |
* W := C * V**T = (C1*V1**T + C2*V2**T) (stored in WORK) |
* |
* |
* W := C2 |
* W := C2 |
* |
* |
DO 220 J = 1, K |
DO 220 J = 1, K |
CALL DCOPY( LASTC, C( 1, LASTV-K+J ), 1, |
CALL DCOPY( LASTC, C( 1, N-K+J ), 1, |
$ WORK( 1, J ), 1 ) |
$ WORK( 1, J ), 1 ) |
220 CONTINUE |
220 CONTINUE |
* |
* |
* W := W * V2**T |
* W := W * V2**T |
* |
* |
CALL DTRMM( 'Right', 'Lower', 'Transpose', 'Unit', |
CALL DTRMM( 'Right', 'Lower', 'Transpose', 'Unit', |
$ LASTC, K, ONE, V( 1, LASTV-K+1 ), LDV, |
$ LASTC, K, ONE, V( 1, N-K+1 ), LDV, |
$ WORK, LDWORK ) |
$ WORK, LDWORK ) |
IF( LASTV.GT.K ) THEN |
IF( N.GT.K ) THEN |
* |
* |
* W := W + C1 * V1**T |
* W := W + C1 * V1**T |
* |
* |
CALL DGEMM( 'No transpose', 'Transpose', |
CALL DGEMM( 'No transpose', 'Transpose', |
$ LASTC, K, LASTV-K, ONE, C, LDC, V, LDV, |
$ LASTC, K, N-K, ONE, C, LDC, V, LDV, |
$ ONE, WORK, LDWORK ) |
$ ONE, WORK, LDWORK ) |
END IF |
END IF |
* |
* |
Line 727
|
Line 723
|
* |
* |
* C := C - W * V |
* C := C - W * V |
* |
* |
IF( LASTV.GT.K ) THEN |
IF( N.GT.K ) THEN |
* |
* |
* C1 := C1 - W * V1 |
* C1 := C1 - W * V1 |
* |
* |
CALL DGEMM( 'No transpose', 'No transpose', |
CALL DGEMM( 'No transpose', 'No transpose', |
$ LASTC, LASTV-K, K, -ONE, WORK, LDWORK, V, LDV, |
$ LASTC, N-K, K, -ONE, WORK, LDWORK, V, LDV, |
$ ONE, C, LDC ) |
$ ONE, C, LDC ) |
END IF |
END IF |
* |
* |
* W := W * V2 |
* W := W * V2 |
* |
* |
CALL DTRMM( 'Right', 'Lower', 'No transpose', 'Unit', |
CALL DTRMM( 'Right', 'Lower', 'No transpose', 'Unit', |
$ LASTC, K, ONE, V( 1, LASTV-K+1 ), LDV, |
$ LASTC, K, ONE, V( 1, N-K+1 ), LDV, |
$ WORK, LDWORK ) |
$ WORK, LDWORK ) |
* |
* |
* C2 := C2 - W |
* C2 := C2 - W |
* |
* |
DO 240 J = 1, K |
DO 240 J = 1, K |
DO 230 I = 1, LASTC |
DO 230 I = 1, LASTC |
C( I, LASTV-K+J ) = C( I, LASTV-K+J ) - WORK(I, J) |
C( I, N-K+J ) = C( I, N-K+J ) - WORK(I, J) |
230 CONTINUE |
230 CONTINUE |
240 CONTINUE |
240 CONTINUE |
* |
* |