*  zlaqps.f (flens/lapack/interface/ref

  1       SUBROUTINE ZLAQPS( M, N, OFFSET, NB, KB, A, LDA, JPVT, TAU, VN1,

  2      $                   VN2, AUXV, F, LDF )

  3 *

  4 *  -- LAPACK auxiliary routine (version 3.3.1) --

  5 *  -- LAPACK is a software package provided by Univ. of Tennessee,    --

  6 *  -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--

  7 *  -- April 2011                                                      --

  8 *

  9 *     .. Scalar Arguments ..

 10       INTEGER            KB, LDA, LDF, M, N, NB, OFFSET

 11 *     ..

 12 *     .. Array Arguments ..

 13       INTEGER            JPVT( * )

 14       DOUBLE PRECISION   VN1( * ), VN2( * )

 15       COMPLEX*16         A( LDA, * ), AUXV( * ), F( LDF, * ), TAU( * )

 16 *     ..

 17 *

 18 *  Purpose

 19 *  =======

 20 *

 21 *  ZLAQPS computes a step of QR factorization with column pivoting

 22 *  of a complex M-by-N matrix A by using Blas-3.  It tries to factorize

 23 *  NB columns from A starting from the row OFFSET+1, and updates all

 24 *  of the matrix with Blas-3 xGEMM.

 25 *

 26 *  In some cases, due to catastrophic cancellations, it cannot

 27 *  factorize NB columns.  Hence, the actual number of factorized

 28 *  columns is returned in KB.

 29 *

 30 *  Block A(1:OFFSET,1:N) is accordingly pivoted, but not factorized.

 31 *

 32 *  Arguments

 33 *  =========

 34 *

 35 *  M       (input) INTEGER

 36 *          The number of rows of the matrix A. M >= 0.

 37 *

 38 *  N       (input) INTEGER

 39 *          The number of columns of the matrix A. N >= 0

 40 *

 41 *  OFFSET  (input) INTEGER

 42 *          The number of rows of A that have been factorized in

 43 *          previous steps.

 44 *

 45 *  NB      (input) INTEGER

 46 *          The number of columns to factorize.

 47 *

 48 *  KB      (output) INTEGER

 49 *          The number of columns actually factorized.

 50 *

 51 *  A       (input/output) COMPLEX*16 array, dimension (LDA,N)

 52 *          On entry, the M-by-N matrix A.

 53 *          On exit, block A(OFFSET+1:M,1:KB) is the triangular

 54 *          factor obtained and block A(1:OFFSET,1:N) has been

 55 *          accordingly pivoted, but no factorized.

 56 *          The rest of the matrix, block A(OFFSET+1:M,KB+1:N) has

 57 *          been updated.

 58 *

 59 *  LDA     (input) INTEGER

 60 *          The leading dimension of the array A. LDA >= max(1,M).

 61 *

 62 *  JPVT    (input/output) INTEGER array, dimension (N)

 63 *          JPVT(I) = K <==> Column K of the full matrix A has been

 64 *          permuted into position I in AP.

 65 *

 66 *  TAU     (output) COMPLEX*16 array, dimension (KB)

 67 *          The scalar factors of the elementary reflectors.

 68 *

 69 *  VN1     (input/output) DOUBLE PRECISION array, dimension (N)

 70 *          The vector with the partial column norms.

 71 *

 72 *  VN2     (input/output) DOUBLE PRECISION array, dimension (N)

 73 *          The vector with the exact column norms.

 74 *

 75 *  AUXV    (input/output) COMPLEX*16 array, dimension (NB)

 76 *          Auxiliar vector.

 77 *

 78 *  F       (input/output) COMPLEX*16 array, dimension (LDF,NB)

 79 *          Matrix F**H = L * Y**H * A.

 80 *

 81 *  LDF     (input) INTEGER

 82 *          The leading dimension of the array F. LDF >= max(1,N).

 83 *

 84 *  Further Details

 85 *  ===============

 86 *

 87 *  Based on contributions by

 88 *    G. Quintana-Orti, Depto. de Informatica, Universidad Jaime I, Spain

 89 *    X. Sun, Computer Science Dept., Duke University, USA

 90 *

 91 *  Partial column norm updating strategy modified by

 92 *    Z. Drmac and Z. Bujanovic, Dept. of Mathematics,

 93 *    University of Zagreb, Croatia.

 94 *  -- April 2011                                                      --

 95 *  For more details see LAPACK Working Note 176.

 96 *  =====================================================================

 97 *

 98 *     .. Parameters ..

 99       DOUBLE PRECISION   ZERO, ONE

100       COMPLEX*16         CZERO, CONE

101       PARAMETER          ( ZERO = 0.0D+0, ONE = 1.0D+0,

102      $                   CZERO = ( 0.0D+0, 0.0D+0 ),

103      $                   CONE = ( 1.0D+0, 0.0D+0 ) )

104 *     ..

105 *     .. Local Scalars ..

106       INTEGER            ITEMP, J, K, LASTRK, LSTICC, PVT, RK

107       DOUBLE PRECISION   TEMP, TEMP2, TOL3Z

108       COMPLEX*16         AKK

109 *     ..

110 *     .. External Subroutines ..

111       EXTERNAL           ZGEMM, ZGEMV, ZLARFG, ZSWAP

112 *     ..

113 *     .. Intrinsic Functions ..

114       INTRINSIC          ABS, DBLE, DCONJG, MAX, MIN, NINT, SQRT

115 *     ..

116 *     .. External Functions ..

117       INTEGER            IDAMAX

118       DOUBLE PRECISION   DLAMCH, DZNRM2

119       EXTERNAL           IDAMAX, DLAMCH, DZNRM2

120 *     ..

121 *     .. Executable Statements ..

122 *

123       LASTRK = MIN( M, N+OFFSET )

124       LSTICC = 0

125       K = 0

126       TOL3Z = SQRT(DLAMCH('Epsilon'))

127 *

128 *     Beginning of while loop.

129 *

130    10 CONTINUE

131       IF( ( K.LT.NB ) .AND. ( LSTICC.EQ.0 ) ) THEN

132          K = K + 1

133          RK = OFFSET + K

134 *

135 *        Determine ith pivot column and swap if necessary

136 *

137          PVT = ( K-1 ) + IDAMAX( N-K+1, VN1( K ), 1 )

138          IF( PVT.NE.K ) THEN

139             CALL ZSWAP( M, A( 1, PVT ), 1, A( 1, K ), 1 )

140             CALL ZSWAP( K-1, F( PVT, 1 ), LDF, F( K, 1 ), LDF )

141             ITEMP = JPVT( PVT )

142             JPVT( PVT ) = JPVT( K )

143             JPVT( K ) = ITEMP

144             VN1( PVT ) = VN1( K )

145             VN2( PVT ) = VN2( K )

146          END IF

147 *

148 *        Apply previous Householder reflectors to column K:

149 *        A(RK:M,K) := A(RK:M,K) - A(RK:M,1:K-1)*F(K,1:K-1)**H.

150 *

151          IF( K.GT.1 ) THEN

152             DO 20 J = 1, K - 1

153                F( K, J ) = DCONJG( F( K, J ) )

154    20       CONTINUE

155             CALL ZGEMV( 'No transpose', M-RK+1, K-1, -CONE, A( RK, 1 ),

156      $                  LDA, F( K, 1 ), LDF, CONE, A( RK, K ), 1 )

157             DO 30 J = 1, K - 1

158                F( K, J ) = DCONJG( F( K, J ) )

159    30       CONTINUE

160          END IF

161 *

162 *        Generate elementary reflector H(k).

163 *

164          IF( RK.LT.M ) THEN

165             CALL ZLARFG( M-RK+1, A( RK, K ), A( RK+1, K ), 1, TAU( K ) )

166          ELSE

167             CALL ZLARFG( 1, A( RK, K ), A( RK, K ), 1, TAU( K ) )

168          END IF

169 *

170          AKK = A( RK, K )

171          A( RK, K ) = CONE

172 *

173 *        Compute Kth column of F:

174 *

175 *        Compute  F(K+1:N,K) := tau(K)*A(RK:M,K+1:N)**H*A(RK:M,K).

176 *

177          IF( K.LT.N ) THEN

178             CALL ZGEMV( 'Conjugate transpose', M-RK+1, N-K, TAU( K ),

179      $                  A( RK, K+1 ), LDA, A( RK, K ), 1, CZERO,

180      $                  F( K+1, K ), 1 )

181          END IF

182 *

183 *        Padding F(1:K,K) with zeros.

184 *

185          DO 40 J = 1, K

186             F( J, K ) = CZERO

187    40    CONTINUE

188 *

189 *        Incremental updating of F:

190 *        F(1:N,K) := F(1:N,K) - tau(K)*F(1:N,1:K-1)*A(RK:M,1:K-1)**H

191 *                    *A(RK:M,K).

192 *

193          IF( K.GT.1 ) THEN

194             CALL ZGEMV( 'Conjugate transpose', M-RK+1, K-1, -TAU( K ),

195      $                  A( RK, 1 ), LDA, A( RK, K ), 1, CZERO,

196      $                  AUXV( 1 ), 1 )

197 *

198             CALL ZGEMV( 'No transpose', N, K-1, CONE, F( 1, 1 ), LDF,

199      $                  AUXV( 1 ), 1, CONE, F( 1, K ), 1 )

200          END IF

201 *

202 *        Update the current row of A:

203 *        A(RK,K+1:N) := A(RK,K+1:N) - A(RK,1:K)*F(K+1:N,1:K)**H.

204 *

205          IF( K.LT.N ) THEN

206             CALL ZGEMM( 'No transpose', 'Conjugate transpose', 1, N-K,

207      $                  K, -CONE, A( RK, 1 ), LDA, F( K+1, 1 ), LDF,

208      $                  CONE, A( RK, K+1 ), LDA )

209          END IF

210 *

211 *        Update partial column norms.

212 *

213          IF( RK.LT.LASTRK ) THEN

214             DO 50 J = K + 1, N

215                IF( VN1( J ).NE.ZERO ) THEN

216 *

217 *                 NOTE: The following 4 lines follow from the analysis in

218 *                 Lapack Working Note 176.

219 *

220                   TEMP = ABS( A( RK, J ) ) / VN1( J )

221                   TEMP = MAX( ZERO, ( ONE+TEMP )*( ONE-TEMP ) )

222                   TEMP2 = TEMP*( VN1( J ) / VN2( J ) )**2

223                   IF( TEMP2 .LE. TOL3Z ) THEN

224                      VN2( J ) = DBLE( LSTICC )

225                      LSTICC = J

226                   ELSE

227                      VN1( J ) = VN1( J )*SQRT( TEMP )

228                   END IF

229                END IF

230    50       CONTINUE

231          END IF

232 *

233          A( RK, K ) = AKK

234 *

235 *        End of while loop.

236 *

237          GO TO 10

238       END IF

239       KB = K

240       RK = OFFSET + KB

241 *

242 *     Apply the block reflector to the rest of the matrix:

243 *     A(OFFSET+KB+1:M,KB+1:N) := A(OFFSET+KB+1:M,KB+1:N) -

244 *                         A(OFFSET+KB+1:M,1:KB)*F(KB+1:N,1:KB)**H.

245 *

246       IF( KB.LT.MIN( N, M-OFFSET ) ) THEN

247          CALL ZGEMM( 'No transpose', 'Conjugate transpose', M-RK, N-KB,

248      $               KB, -CONE, A( RK+1, 1 ), LDA, F( KB+1, 1 ), LDF,

249      $               CONE, A( RK+1, KB+1 ), LDA )

250       END IF

251 *

252 *     Recomputation of difficult columns.

253 *

254    60 CONTINUE

255       IF( LSTICC.GT.0 ) THEN

256          ITEMP = NINT( VN2( LSTICC ) )

257          VN1( LSTICC ) = DZNRM2( M-RK, A( RK+1, LSTICC ), 1 )

258 *

259 *        NOTE: The computation of VN1( LSTICC ) relies on the fact that 

260 *        SNRM2 does not fail on vectors with norm below the value of

261 *        SQRT(DLAMCH('S')) 

262 *

263          VN2( LSTICC ) = VN1( LSTICC )

264          LSTICC = ITEMP

265          GO TO 60

266       END IF

267 *

268       RETURN

269 *

270 *     End of ZLAQPS

271 *

272       END