3
4
5
6
7
8
9
10
11 INTEGER IA, INFO, JA, LIWORK, LWORK, N
12
13
14 INTEGER DESCA( * ), IPIV( * ), IWORK( * )
15 COMPLEX*16 A( * ), WORK( * )
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163 INTEGER BLOCK_CYCLIC_2D, CSRC_, CTXT_, DLEN_, DTYPE_,
164 $ LLD_, MB_, M_, NB_, N_, RSRC_
165 parameter( block_cyclic_2d = 1, dlen_ = 9, dtype_ = 1,
166 $ ctxt_ = 2, m_ = 3, n_ = 4, mb_ = 5, nb_ = 6,
167 $ rsrc_ = 7, csrc_ = 8, lld_ = 9 )
168 COMPLEX*16 ZERO, ONE
169 parameter( zero = 0.0d+0, one = 1.0d+0 )
170
171
172 LOGICAL LQUERY
173 INTEGER I, IACOL, IAROW, ICOFF, ICTXT, IROFF, IW, J,
174 $ JB, JN, LCM, LIWMIN, LWMIN, MP, MYCOL, MYROW,
175 $ NN, NP, NPCOL, NPROW, NQ
176
177
178 INTEGER DESCW( DLEN_ ), IDUM1( 2 ), IDUM2( 2 )
179
180
184
185
186 INTEGER ICEIL, ILCM, INDXG2P, NUMROC
188
189
190 INTRINSIC dble,
max,
min, mod
191
192
193
194
195
196 ictxt = desca( ctxt_ )
197 CALL blacs_gridinfo( ictxt, nprow, npcol, myrow, mycol )
198
199
200
201 info = 0
202 IF( nprow.EQ.-1 ) THEN
203 info = -(500+ctxt_)
204 ELSE
205 CALL chk1mat( n, 1, n, 1, ia, ja, desca, 5, info )
206 IF( info.EQ.0 ) THEN
207 iroff = mod( ia-1, desca( mb_ ) )
208 icoff = mod( ja-1, desca( nb_ ) )
209 iarow =
indxg2p( ia, desca( mb_ ), myrow, desca( rsrc_ ),
210 $ nprow )
211 np =
numroc( n+iroff, desca( mb_ ), myrow, iarow, nprow )
212 lwmin = np * desca( nb_ )
213
214 mp =
numroc( desca( m_ ), desca( mb_ ), myrow,
215 $ desca( rsrc_ ), nprow )
216 nq =
numroc( desca( n_ ), desca( nb_ ), mycol,
217 $ desca( csrc_ ), npcol )
218 IF( nprow.EQ.npcol ) THEN
219 liwmin = nq + desca( nb_ )
220 ELSE
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246 lcm =
ilcm( nprow, npcol )
247 liwmin =
numroc( desca( m_ ) + desca( mb_ ) * nprow
248 $ + mod( ia - 1, desca( mb_ ) ), desca( nb_ ),
249 $ mycol, desca( csrc_ ), npcol ) +
251 $
numroc( desca( m_ ) + desca( mb_ ) * nprow,
252 $ desca( mb_ ), myrow, desca( rsrc_ ), nprow ),
253 $ desca( mb_ ) ), lcm / nprow ), desca( nb_ ) )
254
255 END IF
256
257 work( 1 ) = dble( lwmin )
258 iwork( 1 ) = liwmin
259 lquery = ( lwork.EQ.-1 .OR. liwork.EQ.-1 )
260 IF( iroff.NE.icoff .OR. iroff.NE.0 ) THEN
261 info = -4
262 ELSE IF( desca( mb_ ).NE.desca( nb_ ) ) THEN
263 info = -(500+nb_)
264 ELSE IF( lwork.LT.lwmin .AND. .NOT.lquery ) THEN
265 info = -8
266 ELSE IF( liwork.LT.liwmin .AND. .NOT.lquery ) THEN
267 info = -10
268 END IF
269 END IF
270 IF( lwork.EQ.-1 ) THEN
271 idum1( 1 ) = -1
272 ELSE
273 idum1( 1 ) = 1
274 END IF
275 idum2( 1 ) = 8
276 IF( liwork.EQ.-1 ) THEN
277 idum1( 2 ) = -1
278 ELSE
279 idum1( 2 ) = 1
280 END IF
281 idum2( 2 ) = 10
282 CALL pchk1mat( n, 1, n, 1, ia, ja, desca, 5, 2, idum1, idum2,
283 $ info )
284 END IF
285
286 IF( info.NE.0 ) THEN
287 CALL pxerbla( ictxt,
'PZGETRI', -info )
288 RETURN
289 ELSE IF( lquery ) THEN
290 RETURN
291 END IF
292
293
294
295 IF( n.EQ.0 )
296 $ RETURN
297
298
299
300
301 CALL pztrtri(
'Upper',
'Non-unit', n, a, ia, ja, desca, info )
302 IF( info.GT.0 )
303 $ RETURN
304
305
306
307 jn =
min(
iceil( ja, desca( nb_ ) ) * desca( nb_ ), ja+n-1 )
308 nn = ( ( ja+n-2 ) / desca( nb_ ) ) * desca( nb_ ) + 1
309 iacol =
indxg2p( nn, desca( nb_ ), mycol, desca( csrc_ ), npcol )
310 CALL descset( descw, n+iroff, desca( nb_ ), desca( mb_ ),
311 $ desca( nb_ ), iarow, iacol, ictxt,
max( 1, np ) )
312 iw = iroff + 1
313
314
315
316 DO 10 j = nn, jn+1, -desca( nb_ )
317 jb =
min( desca( nb_ ), ja+n-j )
318 i = ia + j - ja
319
320
321
322 CALL pzlacpy(
'Lower', ja+n-1-j, jb, a, i+1, j, desca,
323 $ work, iw+j-ja+1, 1, descw )
324 CALL pzlaset(
'Lower', ja+n-1-j, jb, zero, zero, a, i+1, j,
325 $ desca )
326
327
328
329 IF( j+jb.LE.ja+n-1 )
330 $ CALL pzgemm( 'No transpose', 'No transpose', n, jb,
331 $ ja+n-j-jb, -one, a, ia, j+jb, desca, work,
332 $ iw+j+jb-ja, 1, descw, one, a, ia, j, desca )
333 CALL pztrsm( 'Right', 'Lower', 'No transpose', 'Unit', n, jb,
334 $ one, work, iw+j-ja, 1, descw, a, ia, j, desca )
335 descw( csrc_ ) = mod( descw( csrc_ ) + npcol - 1, npcol )
336
337 10 CONTINUE
338
339
340
341 jb = jn-ja+1
342
343
344
345 CALL pzlacpy(
'Lower', n-1, jb, a, ia+1, ja, desca, work, iw+1,
346 $ 1, descw )
347 CALL pzlaset(
'Lower', n-1, jb, zero, zero, a, ia+1, ja, desca )
348
349
350
351 IF( ja+jb.LE.ja+n-1 )
352 $ CALL pzgemm( 'No transpose', 'No transpose', n, jb,
353 $ n-jb, -one, a, ia, ja+jb, desca, work, iw+jb, 1,
354 $ descw, one, a, ia, ja, desca )
355 CALL pztrsm( 'Right', 'Lower', 'No transpose', 'Unit', n, jb,
356 $ one, work, iw, 1, descw, a, ia, ja, desca )
357
358
359
360
361 CALL descset( descw, desca( m_ ) + desca( mb_ )*nprow, 1,
362 $ desca( mb_ ), 1, desca( rsrc_ ), mycol, ictxt,
363 $ mp+desca( mb_ ) )
364 CALL pzlapiv(
'Backward',
'Columns',
'Column', n, n, a, ia,
365 $ ja, desca, ipiv, ia, 1, descw, iwork )
366
367 work( 1 ) = dble( lwmin )
368 iwork( 1 ) = liwmin
369
370 RETURN
371
372
373
subroutine chk1mat(ma, mapos0, na, napos0, ia, ja, desca, descapos0, info)
subroutine descset(desc, m, n, mb, nb, irsrc, icsrc, ictxt, lld)
integer function iceil(inum, idenom)
integer function ilcm(m, n)
integer function indxg2p(indxglob, nb, iproc, isrcproc, nprocs)
integer function numroc(n, nb, iproc, isrcproc, nprocs)
subroutine pchk1mat(ma, mapos0, na, napos0, ia, ja, desca, descapos0, nextra, ex, expos, info)
subroutine pxerbla(ictxt, srname, info)
subroutine pzlaset(uplo, m, n, alpha, beta, a, ia, ja, desca)
subroutine pzlacpy(uplo, m, n, a, ia, ja, desca, b, ib, jb, descb)
subroutine pzlapiv(direc, rowcol, pivroc, m, n, a, ia, ja, desca, ipiv, ip, jp, descip, iwork)
subroutine pztrtri(uplo, diag, n, a, ia, ja, desca, info)