PLASMA  2.4.5
PLASMA - Parallel Linear Algebra for Scalable Multi-core Architectures
 All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Groups
clqt03.f
Go to the documentation of this file.
*  CLQT03 -- PLASMA variant of the LAPACK test routine for CUNMLQ.
      SUBROUTINE CLQT03( M, N, K, AF, C, CC, Q, LDA, T, WORK, LWORK,
     $                   RWORK, RESULT )
*
      INCLUDE 'plasmaf.h'
*
*  -- LAPACK test routine (version 3.1) --
*     Univ. of Tennessee, Univ. of California Berkeley and NAG Ltd..
*     November 2006
*
*     .. Scalar Arguments ..
      INTEGER            K, LDA, LWORK, M, N
*     ..
*     .. Array Arguments ..
      INTEGER            T( 2 )
      REAL               RESULT( * ), RWORK( * )
      COMPLEX            AF( LDA, * ), C( LDA, * ), CC( LDA, * ),
     $                   Q( LDA, * ), WORK( LWORK )
*     ..
*
*  Purpose
*  =======
*
*  CLQT03 tests PLASMA_CUNMLQ, which applies the unitary matrix Q of
*  an LQ factorization to a matrix C (Q*C, Q'*C, C*Q or C*Q').
*
*  The result of PLASMA_CUNMLQ is compared with the result of forming
*  Q explicitly by a call to PLASMA_CUNGLQ and then performing the
*  matrix multiplication by a call to CGEMM.
*
*  Only the conjugate-transpose cases (Q'*C and C*Q') are exercised;
*  the no-transpose cases are disabled in the loop over ITRANS.
*
*  Arguments
*  =========
*
*  M       (input) INTEGER
*          The number of rows or columns of the matrix C; C is n-by-m
*          if Q is applied from the left, or m-by-n if Q is applied
*          from the right.  M >= 0.
*
*  N       (input) INTEGER
*          The order of the unitary matrix Q.  N >= 0.
*
*  K       (input) INTEGER
*          The number of elementary reflectors whose product defines
*          the unitary matrix Q.  N >= K >= 0.
*
*  AF      (input) COMPLEX array, dimension (LDA,N)
*          Details of the LQ factorization of an m-by-n matrix.
*          It is passed unchanged to PLASMA_CUNGLQ and PLASMA_CUNMLQ.
*
*  C       (workspace) COMPLEX array, dimension (LDA,N)
*          Holds the random test matrix.
*
*  CC      (workspace) COMPLEX array, dimension (LDA,N)
*          Holds the copy of C that PLASMA_CUNMLQ transforms, and
*          afterwards the difference from the explicit product.
*
*  Q       (workspace) COMPLEX array, dimension (LDA,N)
*          Holds the explicitly generated n-by-n matrix Q.
*
*  LDA     (input) INTEGER
*          The leading dimension of the arrays AF, C, CC, and Q.
*
*  T       (input) INTEGER array, dimension (2)
*          Passed unchanged to PLASMA_CUNGLQ and PLASMA_CUNMLQ.
*          NOTE(review): presumably the PLASMA handle to the
*          auxiliary factorization data that replaces LAPACK's TAU;
*          confirm against the caller.
*
*  WORK    (workspace) COMPLEX array, dimension (LWORK)
*          Not referenced by this routine.
*
*  LWORK   (input) INTEGER
*          The length of WORK.  Used only to dimension WORK.
*
*  RWORK   (workspace) REAL array, dimension (M)
*          Passed to CLANGE as its work array.
*
*  RESULT  (output) REAL array, dimension (4)
*          The test ratios compare two techniques for multiplying a
*          random matrix C by an n-by-n unitary matrix Q.  With
*          D = max(1,N) * norm(C) * EPS, the index convention is
*          RESULT(1) = norm( Q*C  - Q*C  ) / D   (not computed)
*          RESULT(2) = norm( Q'*C - Q'*C ) / D
*          RESULT(3) = norm( C*Q  - C*Q  ) / D   (not computed)
*          RESULT(4) = norm( C*Q' - C*Q' ) / D
*          Entries that are not computed are returned as zero.
*
*  Note: the INFO values returned by the PLASMA routines are not
*  examined here.
*
*  =====================================================================
*
*     .. Parameters ..
      REAL               ZERO, ONE
      PARAMETER          ( ZERO = 0.0E+0, ONE = 1.0E+0 )
      COMPLEX            ROGUE
      PARAMETER          ( ROGUE = ( -1.0E+10, -1.0E+10 ) )
*     ..
*     .. Local Scalars ..
      CHARACTER          SIDE, TRANS
      INTEGER            INFO, ISIDE, ITRANS, J, MC, NC
      INTEGER            PLASMA_SIDE, PLASMA_TRANS
      REAL               CNORM, EPS, RESID
*     ..
*     .. External Functions ..
      LOGICAL            LSAME
      REAL               CLANGE, SLAMCH
      EXTERNAL           LSAME, CLANGE, SLAMCH
*     ..
*     .. External Subroutines ..
      EXTERNAL           CGEMM, CLACPY, CLARNV, CLASET, CUNGLQ,
     $                   CUNMLQ
*     ..
*     .. Local Arrays ..
      INTEGER            ISEED( 4 )
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          CMPLX, MAX, REAL
*     ..
*     .. Scalars in Common ..
      CHARACTER*32       SRNAMT
*     ..
*     .. Common blocks ..
      COMMON             / SRNAMC / SRNAMT
*     ..
*     .. Data statements ..
      DATA               ISEED / 1988, 1989, 1990, 1991 /
*     ..
*     .. Executable Statements ..
*
      EPS = SLAMCH( 'Epsilon' )
*
*     Only the conjugate-transpose cases are run below, so clear all
*     four ratios first; otherwise RESULT(1) and RESULT(3) would be
*     returned undefined.
*
      DO 5 J = 1, 4
         RESULT( J ) = ZERO
    5 CONTINUE
*
*     Initialise Q before generating it: the identity when K > 0,
*     rogue values when K = 0 (in that case Q is reset to the
*     identity just before the explicit product is formed).
*
      IF( K.EQ.0 ) THEN
         CALL CLASET( 'Full', N, N, ROGUE, ROGUE, Q, LDA )
      ELSE
         CALL CLASET( 'Full', N, N, CMPLX( ZERO ), CMPLX( ONE ),
     $                Q, LDA )
      END IF
*
*     Generate the n-by-n matrix Q
*
      SRNAMT = 'CUNGLQ'
      CALL PLASMA_CUNGLQ( N, N, K, AF, LDA, T, Q, LDA, INFO )
*
      DO 30 ISIDE = 1, 2
         IF( ISIDE.EQ.1 ) THEN
            SIDE = 'L'
            PLASMA_SIDE = PlasmaLeft
            MC = N
            NC = M
         ELSE
            SIDE = 'R'
            PLASMA_SIDE = PlasmaRight
            MC = M
            NC = N
         END IF
*
*        Generate MC by NC matrix C
*
         DO 10 J = 1, NC
            CALL CLARNV( 2, ISEED, MC, C( 1, J ) )
   10    CONTINUE
         CNORM = CLANGE( '1', MC, NC, C, LDA, RWORK )
         IF( CNORM.EQ.ZERO )
     $      CNORM = ONE
*
*        The full test would loop ITRANS = 1, 2.  Only the
*        conjugate-transpose case (ITRANS = 2) is supported here.
*
         DO 20 ITRANS = 2, 2
            IF( ITRANS.EQ.1 ) THEN
               TRANS = 'N'
               PLASMA_TRANS = PlasmaNoTrans
            ELSE
               TRANS = 'C'
               PLASMA_TRANS = PlasmaConjTrans
            END IF
*
*           Copy C
*
            CALL CLACPY( 'Full', MC, NC, C, LDA, CC, LDA )
*
*           Apply Q or Q' to C
*
            SRNAMT = 'CUNMLQ'
            CALL PLASMA_CUNMLQ( PLASMA_SIDE, PLASMA_TRANS, MC, NC, K,
     $                          AF, LDA, T, CC, LDA, INFO )
*
*           Form explicit product and subtract.  With no reflectors
*           Q is the identity, so overwrite the rogue values first.
*
            IF( K.EQ.0 ) THEN
               CALL CLASET( 'Full', N, N, CMPLX( ZERO ),
     $                      CMPLX( ONE ), Q, LDA )
            END IF
            IF( LSAME( SIDE, 'L' ) ) THEN
               CALL CGEMM( TRANS, 'No transpose', MC, NC, MC,
     $                     CMPLX( -ONE ), Q, LDA, C, LDA,
     $                     CMPLX( ONE ), CC, LDA )
            ELSE
               CALL CGEMM( 'No transpose', TRANS, MC, NC, NC,
     $                     CMPLX( -ONE ), C, LDA, Q, LDA,
     $                     CMPLX( ONE ), CC, LDA )
            END IF
*
*           Compute error in the difference
*
            RESID = CLANGE( '1', MC, NC, CC, LDA, RWORK )
            RESULT( ( ISIDE-1 )*2+ITRANS ) = RESID /
     $         ( REAL( MAX( 1, N ) )*CNORM*EPS )
*
   20    CONTINUE
   30 CONTINUE
*
      RETURN
*
*     End of CLQT03
*
      END