LAPACK 3.12.0
LAPACK: Linear Algebra PACKage
Loading...
Searching...
No Matches
cgelst.f
Go to the documentation of this file.
1*> \brief <b> CGELST solves overdetermined or underdetermined systems for GE matrices using QR or LQ factorization with compact WY representation of Q.</b>
2*
3* =========== DOCUMENTATION ===========
4*
5* Online html documentation available at
6* http://www.netlib.org/lapack/explore-html/
7*
8*> \htmlonly
9*> Download CGELST + dependencies
10*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/cgelst.f">
11*> [TGZ]</a>
12*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/cgelst.f">
13*> [ZIP]</a>
14*> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/cgelst.f">
15*> [TXT]</a>
16*> \endhtmlonly
17*
18* Definition:
19* ===========
20*
21* SUBROUTINE CGELST( TRANS, M, N, NRHS, A, LDA, B, LDB, WORK, LWORK,
22* INFO )
23*
24* .. Scalar Arguments ..
25* CHARACTER TRANS
26* INTEGER INFO, LDA, LDB, LWORK, M, N, NRHS
27* ..
28* .. Array Arguments ..
29* COMPLEX A( LDA, * ), B( LDB, * ), WORK( * )
30* ..
31*
32*
33*> \par Purpose:
34* =============
35*>
36*> \verbatim
37*>
38*> CGELST solves overdetermined or underdetermined real linear systems
39*> involving an M-by-N matrix A, or its conjugate-transpose, using a QR
40*> or LQ factorization of A with compact WY representation of Q.
41*> It is assumed that A has full rank.
42*>
43*> The following options are provided:
44*>
45*> 1. If TRANS = 'N' and m >= n: find the least squares solution of
46*> an overdetermined system, i.e., solve the least squares problem
47*> minimize || B - A*X ||.
48*>
49*> 2. If TRANS = 'N' and m < n: find the minimum norm solution of
50*> an underdetermined system A * X = B.
51*>
52*> 3. If TRANS = 'C' and m >= n: find the minimum norm solution of
53*> an underdetermined system A**T * X = B.
54*>
55*> 4. If TRANS = 'C' and m < n: find the least squares solution of
56*> an overdetermined system, i.e., solve the least squares problem
57*> minimize || B - A**T * X ||.
58*>
59*> Several right hand side vectors b and solution vectors x can be
60*> handled in a single call; they are stored as the columns of the
61*> M-by-NRHS right hand side matrix B and the N-by-NRHS solution
62*> matrix X.
63*> \endverbatim
64*
65* Arguments:
66* ==========
67*
68*> \param[in] TRANS
69*> \verbatim
70*> TRANS is CHARACTER*1
71*> = 'N': the linear system involves A;
72*> = 'C': the linear system involves A**H.
73*> \endverbatim
74*>
75*> \param[in] M
76*> \verbatim
77*> M is INTEGER
78*> The number of rows of the matrix A. M >= 0.
79*> \endverbatim
80*>
81*> \param[in] N
82*> \verbatim
83*> N is INTEGER
84*> The number of columns of the matrix A. N >= 0.
85*> \endverbatim
86*>
87*> \param[in] NRHS
88*> \verbatim
89*> NRHS is INTEGER
90*> The number of right hand sides, i.e., the number of
91*> columns of the matrices B and X. NRHS >=0.
92*> \endverbatim
93*>
94*> \param[in,out] A
95*> \verbatim
96*> A is COMPLEX array, dimension (LDA,N)
97*> On entry, the M-by-N matrix A.
98*> On exit,
99*> if M >= N, A is overwritten by details of its QR
100*> factorization as returned by CGEQRT;
101*> if M < N, A is overwritten by details of its LQ
102*> factorization as returned by CGELQT.
103*> \endverbatim
104*>
105*> \param[in] LDA
106*> \verbatim
107*> LDA is INTEGER
108*> The leading dimension of the array A. LDA >= max(1,M).
109*> \endverbatim
110*>
111*> \param[in,out] B
112*> \verbatim
113*> B is COMPLEX array, dimension (LDB,NRHS)
114*> On entry, the matrix B of right hand side vectors, stored
115*> columnwise; B is M-by-NRHS if TRANS = 'N', or N-by-NRHS
116*> if TRANS = 'C'.
117*> On exit, if INFO = 0, B is overwritten by the solution
118*> vectors, stored columnwise:
119*> if TRANS = 'N' and m >= n, rows 1 to n of B contain the least
120*> squares solution vectors; the residual sum of squares for the
121*> solution in each column is given by the sum of squares of
122*> modulus of elements N+1 to M in that column;
123*> if TRANS = 'N' and m < n, rows 1 to N of B contain the
124*> minimum norm solution vectors;
125*> if TRANS = 'C' and m >= n, rows 1 to M of B contain the
126*> minimum norm solution vectors;
127*> if TRANS = 'C' and m < n, rows 1 to M of B contain the
128*> least squares solution vectors; the residual sum of squares
129*> for the solution in each column is given by the sum of
130*> squares of the modulus of elements M+1 to N in that column.
131*> \endverbatim
132*>
133*> \param[in] LDB
134*> \verbatim
135*> LDB is INTEGER
136*> The leading dimension of the array B. LDB >= MAX(1,M,N).
137*> \endverbatim
138*>
139*> \param[out] WORK
140*> \verbatim
141*> WORK is COMPLEX array, dimension (MAX(1,LWORK))
142*> On exit, if INFO = 0, WORK(1) returns the optimal LWORK.
143*> \endverbatim
144*>
145*> \param[in] LWORK
146*> \verbatim
147*> LWORK is INTEGER
148*> The dimension of the array WORK.
149*> LWORK >= max( 1, MN + max( MN, NRHS ) ).
150*> For optimal performance,
151*> LWORK >= max( 1, (MN + max( MN, NRHS ))*NB ).
152*> where MN = min(M,N) and NB is the optimum block size.
153*>
154*> If LWORK = -1, then a workspace query is assumed; the routine
155*> only calculates the optimal size of the WORK array, returns
156*> this value as the first entry of the WORK array, and no error
157*> message related to LWORK is issued by XERBLA.
158*> \endverbatim
159*>
160*> \param[out] INFO
161*> \verbatim
162*> INFO is INTEGER
163*> = 0: successful exit
164*> < 0: if INFO = -i, the i-th argument had an illegal value
165*> > 0: if INFO = i, the i-th diagonal element of the
166*> triangular factor of A is zero, so that A does not have
167*> full rank; the least squares solution could not be
168*> computed.
169*> \endverbatim
170*
171* Authors:
172* ========
173*
174*> \author Univ. of Tennessee
175*> \author Univ. of California Berkeley
176*> \author Univ. of Colorado Denver
177*> \author NAG Ltd.
178*
179*> \ingroup gelst
180*
181*> \par Contributors:
182* ==================
183*>
184*> \verbatim
185*>
186*> November 2022, Igor Kozachenko,
187*> Computer Science Division,
188*> University of California, Berkeley
189*> \endverbatim
190*
191* =====================================================================
192 SUBROUTINE cgelst( TRANS, M, N, NRHS, A, LDA, B, LDB, WORK, LWORK,
193 $ INFO )
194*
195* -- LAPACK driver routine --
196* -- LAPACK is a software package provided by Univ. of Tennessee, --
197* -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
198*
199* .. Scalar Arguments ..
200 CHARACTER TRANS
201 INTEGER INFO, LDA, LDB, LWORK, M, N, NRHS
202* ..
203* .. Array Arguments ..
204 COMPLEX A( LDA, * ), B( LDB, * ), WORK( * )
205* ..
206*
207* =====================================================================
208*
209* .. Parameters ..
210 REAL ZERO, ONE
211 parameter( zero = 0.0e+0, one = 1.0e+0 )
212 COMPLEX CZERO
213 parameter( czero = ( 0.0e+0, 0.0e+0 ) )
214* ..
215* .. Local Scalars ..
216 LOGICAL LQUERY, TPSD
217 INTEGER BROW, I, IASCL, IBSCL, J, LWOPT, MN, MNNRHS,
218 $ nb, nbmin, scllen
219 REAL ANRM, BIGNUM, BNRM, SMLNUM
220* ..
221* .. Local Arrays ..
222 REAL RWORK( 1 )
223* ..
224* .. External Functions ..
225 LOGICAL LSAME
226 INTEGER ILAENV
227 REAL SLAMCH, CLANGE, SROUNDUP_LWORK
228 EXTERNAL lsame, ilaenv, slamch, clange, sroundup_lwork
229* ..
230* .. External Subroutines ..
231 EXTERNAL cgelqt, cgeqrt, cgemlqt, cgemqrt,
233* ..
234* .. Intrinsic Functions ..
235 INTRINSIC max, min
236* ..
237* .. Executable Statements ..
238*
239* Test the input arguments.
240*
241 info = 0
242 mn = min( m, n )
243 lquery = ( lwork.EQ.-1 )
244 IF( .NOT.( lsame( trans, 'N' ) .OR. lsame( trans, 'C' ) ) ) THEN
245 info = -1
246 ELSE IF( m.LT.0 ) THEN
247 info = -2
248 ELSE IF( n.LT.0 ) THEN
249 info = -3
250 ELSE IF( nrhs.LT.0 ) THEN
251 info = -4
252 ELSE IF( lda.LT.max( 1, m ) ) THEN
253 info = -6
254 ELSE IF( ldb.LT.max( 1, m, n ) ) THEN
255 info = -8
256 ELSE IF( lwork.LT.max( 1, mn+max( mn, nrhs ) ) .AND. .NOT.lquery )
257 $ THEN
258 info = -10
259 END IF
260*
261* Figure out optimal block size and optimal workspace size
262*
263 IF( info.EQ.0 .OR. info.EQ.-10 ) THEN
264*
265 tpsd = .true.
266 IF( lsame( trans, 'N' ) )
267 $ tpsd = .false.
268*
269 nb = ilaenv( 1, 'CGELST', ' ', m, n, -1, -1 )
270*
271 mnnrhs = max( mn, nrhs )
272 lwopt = max( 1, (mn+mnnrhs)*nb )
273 work( 1 ) = sroundup_lwork( lwopt )
274*
275 END IF
276*
277 IF( info.NE.0 ) THEN
278 CALL xerbla( 'CGELST ', -info )
279 RETURN
280 ELSE IF( lquery ) THEN
281 RETURN
282 END IF
283*
284* Quick return if possible
285*
286 IF( min( m, n, nrhs ).EQ.0 ) THEN
287 CALL claset( 'Full', max( m, n ), nrhs, czero, czero, b, ldb )
288 work( 1 ) = sroundup_lwork( lwopt )
289 RETURN
290 END IF
291*
292* *GEQRT and *GELQT routines cannot accept NB larger than min(M,N)
293*
294 IF( nb.GT.mn ) nb = mn
295*
296* Determine the block size from the supplied LWORK
297* ( at this stage we know that LWORK >= (minimum required workspace,
298* but it may be less than optimal)
299*
300 nb = min( nb, lwork/( mn + mnnrhs ) )
301*
302* The minimum value of NB, when blocked code is used
303*
304 nbmin = max( 2, ilaenv( 2, 'CGELST', ' ', m, n, -1, -1 ) )
305*
306 IF( nb.LT.nbmin ) THEN
307 nb = 1
308 END IF
309*
310* Get machine parameters
311*
312 smlnum = slamch( 'S' ) / slamch( 'P' )
313 bignum = one / smlnum
314*
315* Scale A, B if max element outside range [SMLNUM,BIGNUM]
316*
317 anrm = clange( 'M', m, n, a, lda, rwork )
318 iascl = 0
319 IF( anrm.GT.zero .AND. anrm.LT.smlnum ) THEN
320*
321* Scale matrix norm up to SMLNUM
322*
323 CALL clascl( 'G', 0, 0, anrm, smlnum, m, n, a, lda, info )
324 iascl = 1
325 ELSE IF( anrm.GT.bignum ) THEN
326*
327* Scale matrix norm down to BIGNUM
328*
329 CALL clascl( 'G', 0, 0, anrm, bignum, m, n, a, lda, info )
330 iascl = 2
331 ELSE IF( anrm.EQ.zero ) THEN
332*
333* Matrix all zero. Return zero solution.
334*
335 CALL claset( 'Full', max( m, n ), nrhs, czero, czero, b, ldb )
336 work( 1 ) = sroundup_lwork( lwopt )
337 RETURN
338 END IF
339*
340 brow = m
341 IF( tpsd )
342 $ brow = n
343 bnrm = clange( 'M', brow, nrhs, b, ldb, rwork )
344 ibscl = 0
345 IF( bnrm.GT.zero .AND. bnrm.LT.smlnum ) THEN
346*
347* Scale matrix norm up to SMLNUM
348*
349 CALL clascl( 'G', 0, 0, bnrm, smlnum, brow, nrhs, b, ldb,
350 $ info )
351 ibscl = 1
352 ELSE IF( bnrm.GT.bignum ) THEN
353*
354* Scale matrix norm down to BIGNUM
355*
356 CALL clascl( 'G', 0, 0, bnrm, bignum, brow, nrhs, b, ldb,
357 $ info )
358 ibscl = 2
359 END IF
360*
361 IF( m.GE.n ) THEN
362*
363* M > N:
364* Compute the blocked QR factorization of A,
365* using the compact WY representation of Q,
366* workspace at least N, optimally N*NB.
367*
368 CALL cgeqrt( m, n, nb, a, lda, work( 1 ), nb,
369 $ work( mn*nb+1 ), info )
370*
371 IF( .NOT.tpsd ) THEN
372*
373* M > N, A is not transposed:
374* Overdetermined system of equations,
375* least-squares problem, min || A * X - B ||.
376*
377* Compute B(1:M,1:NRHS) := Q**T * B(1:M,1:NRHS),
378* using the compact WY representation of Q,
379* workspace at least NRHS, optimally NRHS*NB.
380*
381 CALL cgemqrt( 'Left', 'Conjugate transpose', m, nrhs, n, nb,
382 $ a, lda, work( 1 ), nb, b, ldb,
383 $ work( mn*nb+1 ), info )
384*
385* Compute B(1:N,1:NRHS) := inv(R) * B(1:N,1:NRHS)
386*
387 CALL ctrtrs( 'Upper', 'No transpose', 'Non-unit', n, nrhs,
388 $ a, lda, b, ldb, info )
389*
390 IF( info.GT.0 ) THEN
391 RETURN
392 END IF
393*
394 scllen = n
395*
396 ELSE
397*
398* M > N, A is transposed:
399* Underdetermined system of equations,
400* minimum norm solution of A**T * X = B.
401*
402* Compute B := inv(R**T) * B in two row blocks of B.
403*
404* Block 1: B(1:N,1:NRHS) := inv(R**T) * B(1:N,1:NRHS)
405*
406 CALL ctrtrs( 'Upper', 'Conjugate transpose', 'Non-unit',
407 $ n, nrhs, a, lda, b, ldb, info )
408*
409 IF( info.GT.0 ) THEN
410 RETURN
411 END IF
412*
413* Block 2: Zero out all rows below the N-th row in B:
414* B(N+1:M,1:NRHS) = ZERO
415*
416 DO j = 1, nrhs
417 DO i = n + 1, m
418 b( i, j ) = zero
419 END DO
420 END DO
421*
422* Compute B(1:M,1:NRHS) := Q(1:N,:) * B(1:N,1:NRHS),
423* using the compact WY representation of Q,
424* workspace at least NRHS, optimally NRHS*NB.
425*
426 CALL cgemqrt( 'Left', 'No transpose', m, nrhs, n, nb,
427 $ a, lda, work( 1 ), nb, b, ldb,
428 $ work( mn*nb+1 ), info )
429*
430 scllen = m
431*
432 END IF
433*
434 ELSE
435*
436* M < N:
437* Compute the blocked LQ factorization of A,
438* using the compact WY representation of Q,
439* workspace at least M, optimally M*NB.
440*
441 CALL cgelqt( m, n, nb, a, lda, work( 1 ), nb,
442 $ work( mn*nb+1 ), info )
443*
444 IF( .NOT.tpsd ) THEN
445*
446* M < N, A is not transposed:
447* Underdetermined system of equations,
448* minimum norm solution of A * X = B.
449*
450* Compute B := inv(L) * B in two row blocks of B.
451*
452* Block 1: B(1:M,1:NRHS) := inv(L) * B(1:M,1:NRHS)
453*
454 CALL ctrtrs( 'Lower', 'No transpose', 'Non-unit', m, nrhs,
455 $ a, lda, b, ldb, info )
456*
457 IF( info.GT.0 ) THEN
458 RETURN
459 END IF
460*
461* Block 2: Zero out all rows below the M-th row in B:
462* B(M+1:N,1:NRHS) = ZERO
463*
464 DO j = 1, nrhs
465 DO i = m + 1, n
466 b( i, j ) = zero
467 END DO
468 END DO
469*
470* Compute B(1:N,1:NRHS) := Q(1:N,:)**T * B(1:M,1:NRHS),
471* using the compact WY representation of Q,
472* workspace at least NRHS, optimally NRHS*NB.
473*
474 CALL cgemlqt( 'Left', 'Conjugate transpose', n, nrhs, m, nb,
475 $ a, lda, work( 1 ), nb, b, ldb,
476 $ work( mn*nb+1 ), info )
477*
478 scllen = n
479*
480 ELSE
481*
482* M < N, A is transposed:
483* Overdetermined system of equations,
484* least-squares problem, min || A**T * X - B ||.
485*
486* Compute B(1:N,1:NRHS) := Q * B(1:N,1:NRHS),
487* using the compact WY representation of Q,
488* workspace at least NRHS, optimally NRHS*NB.
489*
490 CALL cgemlqt( 'Left', 'No transpose', n, nrhs, m, nb,
491 $ a, lda, work( 1 ), nb, b, ldb,
492 $ work( mn*nb+1), info )
493*
494* Compute B(1:M,1:NRHS) := inv(L**T) * B(1:M,1:NRHS)
495*
496 CALL ctrtrs( 'Lower', 'Conjugate transpose', 'Non-unit',
497 $ m, nrhs, a, lda, b, ldb, info )
498*
499 IF( info.GT.0 ) THEN
500 RETURN
501 END IF
502*
503 scllen = m
504*
505 END IF
506*
507 END IF
508*
509* Undo scaling
510*
511 IF( iascl.EQ.1 ) THEN
512 CALL clascl( 'G', 0, 0, anrm, smlnum, scllen, nrhs, b, ldb,
513 $ info )
514 ELSE IF( iascl.EQ.2 ) THEN
515 CALL clascl( 'G', 0, 0, anrm, bignum, scllen, nrhs, b, ldb,
516 $ info )
517 END IF
518 IF( ibscl.EQ.1 ) THEN
519 CALL clascl( 'G', 0, 0, smlnum, bnrm, scllen, nrhs, b, ldb,
520 $ info )
521 ELSE IF( ibscl.EQ.2 ) THEN
522 CALL clascl( 'G', 0, 0, bignum, bnrm, scllen, nrhs, b, ldb,
523 $ info )
524 END IF
525*
526 work( 1 ) = sroundup_lwork( lwopt )
527*
528 RETURN
529*
530* End of CGELST
531*
532 END
subroutine xerbla(srname, info)
Definition cblat2.f:3285
subroutine cgelqt(m, n, mb, a, lda, t, ldt, work, info)
CGELQT
Definition cgelqt.f:124
subroutine cgelst(trans, m, n, nrhs, a, lda, b, ldb, work, lwork, info)
CGELST solves overdetermined or underdetermined systems for GE matrices using QR or LQ factorization ...
Definition cgelst.f:194
subroutine cgemlqt(side, trans, m, n, k, mb, v, ldv, t, ldt, c, ldc, work, info)
CGEMLQT
Definition cgemlqt.f:153
subroutine cgemqrt(side, trans, m, n, k, nb, v, ldv, t, ldt, c, ldc, work, info)
CGEMQRT
Definition cgemqrt.f:168
subroutine cgeqrt(m, n, nb, a, lda, t, ldt, work, info)
CGEQRT
Definition cgeqrt.f:141
subroutine clascl(type, kl, ku, cfrom, cto, m, n, a, lda, info)
CLASCL multiplies a general rectangular matrix by a real scalar defined as cto/cfrom.
Definition clascl.f:143
subroutine claset(uplo, m, n, alpha, beta, a, lda)
CLASET initializes the off-diagonal elements and the diagonal elements of a matrix to given values.
Definition claset.f:106
subroutine ctrtrs(uplo, trans, diag, n, nrhs, a, lda, b, ldb, info)
CTRTRS
Definition ctrtrs.f:140