You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

sgelst.f 16 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530
  1. *> \brief <b> SGELST solves overdetermined or underdetermined systems for GE matrices using QR or LQ factorization with compact WY representation of Q.</b>
  2. *
  3. * =========== DOCUMENTATION ===========
  4. *
  5. * Online html documentation available at
  6. * http://www.netlib.org/lapack/explore-html/
  7. *
  8. *> \htmlonly
  9. *> Download SGELST + dependencies
  10. *> <a href="http://www.netlib.org/cgi-bin/netlibfiles.tgz?format=tgz&filename=/lapack/lapack_routine/sgelst.f">
  11. *> [TGZ]</a>
  12. *> <a href="http://www.netlib.org/cgi-bin/netlibfiles.zip?format=zip&filename=/lapack/lapack_routine/sgelst.f">
  13. *> [ZIP]</a>
  14. *> <a href="http://www.netlib.org/cgi-bin/netlibfiles.txt?format=txt&filename=/lapack/lapack_routine/sgelst.f">
  15. *> [TXT]</a>
  16. *> \endhtmlonly
  17. *
  18. * Definition:
  19. * ===========
  20. *
  21. * SUBROUTINE SGELST( TRANS, M, N, NRHS, A, LDA, B, LDB, WORK, LWORK,
  22. * INFO )
  23. *
  24. * .. Scalar Arguments ..
  25. * CHARACTER TRANS
  26. * INTEGER INFO, LDA, LDB, LWORK, M, N, NRHS
  27. * ..
  28. * .. Array Arguments ..
  29. * REAL A( LDA, * ), B( LDB, * ), WORK( * )
  30. * ..
  31. *
  32. *
  33. *> \par Purpose:
  34. * =============
  35. *>
  36. *> \verbatim
  37. *>
  38. *> SGELST solves overdetermined or underdetermined real linear systems
  39. *> involving an M-by-N matrix A, or its transpose, using a QR or LQ
  40. *> factorization of A with compact WY representation of Q.
  41. *> It is assumed that A has full rank.
  42. *>
  43. *> The following options are provided:
  44. *>
  45. *> 1. If TRANS = 'N' and m >= n: find the least squares solution of
  46. *> an overdetermined system, i.e., solve the least squares problem
  47. *> minimize || B - A*X ||.
  48. *>
  49. *> 2. If TRANS = 'N' and m < n: find the minimum norm solution of
  50. *> an underdetermined system A * X = B.
  51. *>
  52. *> 3. If TRANS = 'T' and m >= n: find the minimum norm solution of
  53. *> an underdetermined system A**T * X = B.
  54. *>
  55. *> 4. If TRANS = 'T' and m < n: find the least squares solution of
  56. *> an overdetermined system, i.e., solve the least squares problem
  57. *> minimize || B - A**T * X ||.
  58. *>
  59. *> Several right hand side vectors b and solution vectors x can be
  60. *> handled in a single call; they are stored as the columns of the
  61. *> M-by-NRHS right hand side matrix B and the N-by-NRHS solution
  62. *> matrix X.
  63. *> \endverbatim
  64. *
  65. * Arguments:
  66. * ==========
  67. *
  68. *> \param[in] TRANS
  69. *> \verbatim
  70. *> TRANS is CHARACTER*1
  71. *> = 'N': the linear system involves A;
  72. *> = 'T': the linear system involves A**T.
  73. *> \endverbatim
  74. *>
  75. *> \param[in] M
  76. *> \verbatim
  77. *> M is INTEGER
  78. *> The number of rows of the matrix A. M >= 0.
  79. *> \endverbatim
  80. *>
  81. *> \param[in] N
  82. *> \verbatim
  83. *> N is INTEGER
  84. *> The number of columns of the matrix A. N >= 0.
  85. *> \endverbatim
  86. *>
  87. *> \param[in] NRHS
  88. *> \verbatim
  89. *> NRHS is INTEGER
  90. *> The number of right hand sides, i.e., the number of
  91. *> columns of the matrices B and X. NRHS >=0.
  92. *> \endverbatim
  93. *>
  94. *> \param[in,out] A
  95. *> \verbatim
  96. *> A is REAL array, dimension (LDA,N)
  97. *> On entry, the M-by-N matrix A.
  98. *> On exit,
  99. *> if M >= N, A is overwritten by details of its QR
  100. *> factorization as returned by SGEQRT;
  101. *> if M < N, A is overwritten by details of its LQ
  102. *> factorization as returned by SGELQT.
  103. *> \endverbatim
  104. *>
  105. *> \param[in] LDA
  106. *> \verbatim
  107. *> LDA is INTEGER
  108. *> The leading dimension of the array A. LDA >= max(1,M).
  109. *> \endverbatim
  110. *>
  111. *> \param[in,out] B
  112. *> \verbatim
  113. *> B is REAL array, dimension (LDB,NRHS)
  114. *> On entry, the matrix B of right hand side vectors, stored
  115. *> columnwise; B is M-by-NRHS if TRANS = 'N', or N-by-NRHS
  116. *> if TRANS = 'T'.
  117. *> On exit, if INFO = 0, B is overwritten by the solution
  118. *> vectors, stored columnwise:
  119. *> if TRANS = 'N' and m >= n, rows 1 to n of B contain the least
  120. *> squares solution vectors; the residual sum of squares for the
  121. *> solution in each column is given by the sum of squares of
  122. *> elements N+1 to M in that column;
  123. *> if TRANS = 'N' and m < n, rows 1 to N of B contain the
  124. *> minimum norm solution vectors;
  125. *> if TRANS = 'T' and m >= n, rows 1 to M of B contain the
  126. *> minimum norm solution vectors;
  127. *> if TRANS = 'T' and m < n, rows 1 to M of B contain the
  128. *> least squares solution vectors; the residual sum of squares
  129. *> for the solution in each column is given by the sum of
  130. *> squares of elements M+1 to N in that column.
  131. *> \endverbatim
  132. *>
  133. *> \param[in] LDB
  134. *> \verbatim
  135. *> LDB is INTEGER
  136. *> The leading dimension of the array B. LDB >= MAX(1,M,N).
  137. *> \endverbatim
  138. *>
  139. *> \param[out] WORK
  140. *> \verbatim
  141. *> WORK is REAL array, dimension (MAX(1,LWORK))
  142. *> On exit, if INFO = 0, WORK(1) returns the optimal LWORK.
  143. *> \endverbatim
  144. *>
  145. *> \param[in] LWORK
  146. *> \verbatim
  147. *> LWORK is INTEGER
  148. *> The dimension of the array WORK.
  149. *> LWORK >= max( 1, MN + max( MN, NRHS ) ).
  150. *> For optimal performance,
  151. *> LWORK >= max( 1, (MN + max( MN, NRHS ))*NB ).
  152. *> where MN = min(M,N) and NB is the optimum block size.
  153. *>
  154. *> If LWORK = -1, then a workspace query is assumed; the routine
  155. *> only calculates the optimal size of the WORK array, returns
  156. *> this value as the first entry of the WORK array, and no error
  157. *> message related to LWORK is issued by XERBLA.
  158. *> \endverbatim
  159. *>
  160. *> \param[out] INFO
  161. *> \verbatim
  162. *> INFO is INTEGER
  163. *> = 0: successful exit
  164. *> < 0: if INFO = -i, the i-th argument had an illegal value
  165. *> > 0: if INFO = i, the i-th diagonal element of the
  166. *> triangular factor of A is zero, so that A does not have
  167. *> full rank; the least squares solution could not be
  168. *> computed.
  169. *> \endverbatim
  170. *
  171. * Authors:
  172. * ========
  173. *
  174. *> \author Univ. of Tennessee
  175. *> \author Univ. of California Berkeley
  176. *> \author Univ. of Colorado Denver
  177. *> \author NAG Ltd.
  178. *
  179. *> \ingroup gelst
  180. *
  181. *> \par Contributors:
  182. * ==================
  183. *>
  184. *> \verbatim
  185. *>
  186. *> November 2022, Igor Kozachenko,
  187. *> Computer Science Division,
  188. *> University of California, Berkeley
  189. *> \endverbatim
  190. *
  191. * =====================================================================
  192. SUBROUTINE SGELST( TRANS, M, N, NRHS, A, LDA, B, LDB, WORK, LWORK,
  193. $ INFO )
  194. *
  195. * -- LAPACK driver routine --
  196. * -- LAPACK is a software package provided by Univ. of Tennessee, --
  197. * -- Univ. of California Berkeley, Univ. of Colorado Denver and NAG Ltd..--
  198. *
  199. * .. Scalar Arguments ..
  200. CHARACTER TRANS
  201. INTEGER INFO, LDA, LDB, LWORK, M, N, NRHS
  202. * ..
  203. * .. Array Arguments ..
  204. REAL A( LDA, * ), B( LDB, * ), WORK( * )
  205. * ..
  206. *
  207. * =====================================================================
  208. *
  209. * .. Parameters ..
  210. REAL ZERO, ONE
  211. PARAMETER ( ZERO = 0.0E+0, ONE = 1.0E+0 )
  212. * ..
  213. * .. Local Scalars ..
  214. LOGICAL LQUERY, TPSD
  215. INTEGER BROW, I, IASCL, IBSCL, J, LWOPT, MN, MNNRHS,
  216. $ NB, NBMIN, SCLLEN
  217. REAL ANRM, BIGNUM, BNRM, SMLNUM
  218. * ..
  219. * .. Local Arrays ..
  220. REAL RWORK( 1 )
  221. * ..
  222. * .. External Functions ..
  223. LOGICAL LSAME
  224. INTEGER ILAENV
  225. REAL SLAMCH, SLANGE, SROUNDUP_LWORK
  226. EXTERNAL LSAME, ILAENV, SLAMCH, SLANGE, SROUNDUP_LWORK
  227. * ..
  228. * .. External Subroutines ..
  229. EXTERNAL SGELQT, SGEQRT, SGEMLQT, SGEMQRT,
  230. $ SLASCL, SLASET, STRTRS, XERBLA
  231. * ..
  232. * .. Intrinsic Functions ..
  233. INTRINSIC MAX, MIN
  234. * ..
  235. * .. Executable Statements ..
  236. *
  237. * Test the input arguments.
  238. *
  239. INFO = 0
  240. MN = MIN( M, N )
  241. LQUERY = ( LWORK.EQ.-1 )
  242. IF( .NOT.( LSAME( TRANS, 'N' ) .OR. LSAME( TRANS, 'T' ) ) ) THEN
  243. INFO = -1
  244. ELSE IF( M.LT.0 ) THEN
  245. INFO = -2
  246. ELSE IF( N.LT.0 ) THEN
  247. INFO = -3
  248. ELSE IF( NRHS.LT.0 ) THEN
  249. INFO = -4
  250. ELSE IF( LDA.LT.MAX( 1, M ) ) THEN
  251. INFO = -6
  252. ELSE IF( LDB.LT.MAX( 1, M, N ) ) THEN
  253. INFO = -8
  254. ELSE IF( LWORK.LT.MAX( 1, MN+MAX( MN, NRHS ) ) .AND. .NOT.LQUERY )
  255. $ THEN
  256. INFO = -10
  257. END IF
  258. *
  259. * Figure out optimal block size and optimal workspace size
  260. *
  261. IF( INFO.EQ.0 .OR. INFO.EQ.-10 ) THEN
  262. *
  263. TPSD = .TRUE.
  264. IF( LSAME( TRANS, 'N' ) )
  265. $ TPSD = .FALSE.
  266. *
  267. NB = ILAENV( 1, 'SGELST', ' ', M, N, -1, -1 )
  268. *
  269. MNNRHS = MAX( MN, NRHS )
  270. LWOPT = MAX( 1, (MN+MNNRHS)*NB )
  271. WORK( 1 ) = SROUNDUP_LWORK( LWOPT )
  272. *
  273. END IF
  274. *
  275. IF( INFO.NE.0 ) THEN
  276. CALL XERBLA( 'SGELST ', -INFO )
  277. RETURN
  278. ELSE IF( LQUERY ) THEN
  279. RETURN
  280. END IF
  281. *
  282. * Quick return if possible
  283. *
  284. IF( MIN( M, N, NRHS ).EQ.0 ) THEN
  285. CALL SLASET( 'Full', MAX( M, N ), NRHS, ZERO, ZERO, B, LDB )
  286. WORK( 1 ) = SROUNDUP_LWORK( LWOPT )
  287. RETURN
  288. END IF
  289. *
  290. * *GEQRT and *GELQT routines cannot accept NB larger than min(M,N)
  291. *
  292. IF( NB.GT.MN ) NB = MN
  293. *
  294. * Determine the block size from the supplied LWORK
  295. * ( at this stage we know that LWORK >= (minimum required workspace,
  296. * but it may be less than optimal)
  297. *
  298. NB = MIN( NB, LWORK/( MN + MNNRHS ) )
  299. *
  300. * The minimum value of NB, when blocked code is used
  301. *
  302. NBMIN = MAX( 2, ILAENV( 2, 'SGELST', ' ', M, N, -1, -1 ) )
  303. *
  304. IF( NB.LT.NBMIN ) THEN
  305. NB = 1
  306. END IF
  307. *
  308. * Get machine parameters
  309. *
  310. SMLNUM = SLAMCH( 'S' ) / SLAMCH( 'P' )
  311. BIGNUM = ONE / SMLNUM
  312. *
  313. * Scale A, B if max element outside range [SMLNUM,BIGNUM]
  314. *
  315. ANRM = SLANGE( 'M', M, N, A, LDA, RWORK )
  316. IASCL = 0
  317. IF( ANRM.GT.ZERO .AND. ANRM.LT.SMLNUM ) THEN
  318. *
  319. * Scale matrix norm up to SMLNUM
  320. *
  321. CALL SLASCL( 'G', 0, 0, ANRM, SMLNUM, M, N, A, LDA, INFO )
  322. IASCL = 1
  323. ELSE IF( ANRM.GT.BIGNUM ) THEN
  324. *
  325. * Scale matrix norm down to BIGNUM
  326. *
  327. CALL SLASCL( 'G', 0, 0, ANRM, BIGNUM, M, N, A, LDA, INFO )
  328. IASCL = 2
  329. ELSE IF( ANRM.EQ.ZERO ) THEN
  330. *
  331. * Matrix all zero. Return zero solution.
  332. *
  333. CALL SLASET( 'Full', MAX( M, N ), NRHS, ZERO, ZERO, B, LDB )
  334. WORK( 1 ) = SROUNDUP_LWORK( LWOPT )
  335. RETURN
  336. END IF
  337. *
  338. BROW = M
  339. IF( TPSD )
  340. $ BROW = N
  341. BNRM = SLANGE( 'M', BROW, NRHS, B, LDB, RWORK )
  342. IBSCL = 0
  343. IF( BNRM.GT.ZERO .AND. BNRM.LT.SMLNUM ) THEN
  344. *
  345. * Scale matrix norm up to SMLNUM
  346. *
  347. CALL SLASCL( 'G', 0, 0, BNRM, SMLNUM, BROW, NRHS, B, LDB,
  348. $ INFO )
  349. IBSCL = 1
  350. ELSE IF( BNRM.GT.BIGNUM ) THEN
  351. *
  352. * Scale matrix norm down to BIGNUM
  353. *
  354. CALL SLASCL( 'G', 0, 0, BNRM, BIGNUM, BROW, NRHS, B, LDB,
  355. $ INFO )
  356. IBSCL = 2
  357. END IF
  358. *
  359. IF( M.GE.N ) THEN
  360. *
  361. * M > N:
  362. * Compute the blocked QR factorization of A,
  363. * using the compact WY representation of Q,
  364. * workspace at least N, optimally N*NB.
  365. *
  366. CALL SGEQRT( M, N, NB, A, LDA, WORK( 1 ), NB,
  367. $ WORK( MN*NB+1 ), INFO )
  368. *
  369. IF( .NOT.TPSD ) THEN
  370. *
  371. * M > N, A is not transposed:
  372. * Overdetermined system of equations,
  373. * least-squares problem, min || A * X - B ||.
  374. *
  375. * Compute B(1:M,1:NRHS) := Q**T * B(1:M,1:NRHS),
  376. * using the compact WY representation of Q,
  377. * workspace at least NRHS, optimally NRHS*NB.
  378. *
  379. CALL SGEMQRT( 'Left', 'Transpose', M, NRHS, N, NB, A, LDA,
  380. $ WORK( 1 ), NB, B, LDB, WORK( MN*NB+1 ),
  381. $ INFO )
  382. *
  383. * Compute B(1:N,1:NRHS) := inv(R) * B(1:N,1:NRHS)
  384. *
  385. CALL STRTRS( 'Upper', 'No transpose', 'Non-unit', N, NRHS,
  386. $ A, LDA, B, LDB, INFO )
  387. *
  388. IF( INFO.GT.0 ) THEN
  389. RETURN
  390. END IF
  391. *
  392. SCLLEN = N
  393. *
  394. ELSE
  395. *
  396. * M > N, A is transposed:
  397. * Underdetermined system of equations,
  398. * minimum norm solution of A**T * X = B.
  399. *
  400. * Compute B := inv(R**T) * B in two row blocks of B.
  401. *
  402. * Block 1: B(1:N,1:NRHS) := inv(R**T) * B(1:N,1:NRHS)
  403. *
  404. CALL STRTRS( 'Upper', 'Transpose', 'Non-unit', N, NRHS,
  405. $ A, LDA, B, LDB, INFO )
  406. *
  407. IF( INFO.GT.0 ) THEN
  408. RETURN
  409. END IF
  410. *
  411. * Block 2: Zero out all rows below the N-th row in B:
  412. * B(N+1:M,1:NRHS) = ZERO
  413. *
  414. DO J = 1, NRHS
  415. DO I = N + 1, M
  416. B( I, J ) = ZERO
  417. END DO
  418. END DO
  419. *
  420. * Compute B(1:M,1:NRHS) := Q(1:N,:) * B(1:N,1:NRHS),
  421. * using the compact WY representation of Q,
  422. * workspace at least NRHS, optimally NRHS*NB.
  423. *
  424. CALL SGEMQRT( 'Left', 'No transpose', M, NRHS, N, NB,
  425. $ A, LDA, WORK( 1 ), NB, B, LDB,
  426. $ WORK( MN*NB+1 ), INFO )
  427. *
  428. SCLLEN = M
  429. *
  430. END IF
  431. *
  432. ELSE
  433. *
  434. * M < N:
  435. * Compute the blocked LQ factorization of A,
  436. * using the compact WY representation of Q,
  437. * workspace at least M, optimally M*NB.
  438. *
  439. CALL SGELQT( M, N, NB, A, LDA, WORK( 1 ), NB,
  440. $ WORK( MN*NB+1 ), INFO )
  441. *
  442. IF( .NOT.TPSD ) THEN
  443. *
  444. * M < N, A is not transposed:
  445. * Underdetermined system of equations,
  446. * minimum norm solution of A * X = B.
  447. *
  448. * Compute B := inv(L) * B in two row blocks of B.
  449. *
  450. * Block 1: B(1:M,1:NRHS) := inv(L) * B(1:M,1:NRHS)
  451. *
  452. CALL STRTRS( 'Lower', 'No transpose', 'Non-unit', M, NRHS,
  453. $ A, LDA, B, LDB, INFO )
  454. *
  455. IF( INFO.GT.0 ) THEN
  456. RETURN
  457. END IF
  458. *
  459. * Block 2: Zero out all rows below the M-th row in B:
  460. * B(M+1:N,1:NRHS) = ZERO
  461. *
  462. DO J = 1, NRHS
  463. DO I = M + 1, N
  464. B( I, J ) = ZERO
  465. END DO
  466. END DO
  467. *
  468. * Compute B(1:N,1:NRHS) := Q(1:N,:)**T * B(1:M,1:NRHS),
  469. * using the compact WY representation of Q,
  470. * workspace at least NRHS, optimally NRHS*NB.
  471. *
  472. CALL SGEMLQT( 'Left', 'Transpose', N, NRHS, M, NB, A, LDA,
  473. $ WORK( 1 ), NB, B, LDB,
  474. $ WORK( MN*NB+1 ), INFO )
  475. *
  476. SCLLEN = N
  477. *
  478. ELSE
  479. *
  480. * M < N, A is transposed:
  481. * Overdetermined system of equations,
  482. * least-squares problem, min || A**T * X - B ||.
  483. *
  484. * Compute B(1:N,1:NRHS) := Q * B(1:N,1:NRHS),
  485. * using the compact WY representation of Q,
  486. * workspace at least NRHS, optimally NRHS*NB.
  487. *
  488. CALL SGEMLQT( 'Left', 'No transpose', N, NRHS, M, NB,
  489. $ A, LDA, WORK( 1 ), NB, B, LDB,
  490. $ WORK( MN*NB+1), INFO )
  491. *
  492. * Compute B(1:M,1:NRHS) := inv(L**T) * B(1:M,1:NRHS)
  493. *
  494. CALL STRTRS( 'Lower', 'Transpose', 'Non-unit', M, NRHS,
  495. $ A, LDA, B, LDB, INFO )
  496. *
  497. IF( INFO.GT.0 ) THEN
  498. RETURN
  499. END IF
  500. *
  501. SCLLEN = M
  502. *
  503. END IF
  504. *
  505. END IF
  506. *
  507. * Undo scaling
  508. *
  509. IF( IASCL.EQ.1 ) THEN
  510. CALL SLASCL( 'G', 0, 0, ANRM, SMLNUM, SCLLEN, NRHS, B, LDB,
  511. $ INFO )
  512. ELSE IF( IASCL.EQ.2 ) THEN
  513. CALL SLASCL( 'G', 0, 0, ANRM, BIGNUM, SCLLEN, NRHS, B, LDB,
  514. $ INFO )
  515. END IF
  516. IF( IBSCL.EQ.1 ) THEN
  517. CALL SLASCL( 'G', 0, 0, SMLNUM, BNRM, SCLLEN, NRHS, B, LDB,
  518. $ INFO )
  519. ELSE IF( IBSCL.EQ.2 ) THEN
  520. CALL SLASCL( 'G', 0, 0, BIGNUM, BNRM, SCLLEN, NRHS, B, LDB,
  521. $ INFO )
  522. END IF
  523. *
  524. WORK( 1 ) = SROUNDUP_LWORK( LWOPT )
  525. *
  526. RETURN
  527. *
  528. * End of SGELST
  529. *
  530. END