3
4
5
6
7
8
9 INTEGER BWL, BWU, INFO, JA, LAF, LWORK, N
10
11
12 INTEGER DESCA( * )
13 COMPLEX A( * ), AF( * ), WORK( * )
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348 REAL ONE, ZERO
349 parameter( one = 1.0e+0 )
350 parameter( zero = 0.0e+0 )
351 COMPLEX CONE, CZERO
352 parameter( cone = ( 1.0e+0, 0.0e+0 ) )
353 parameter( czero = ( 0.0e+0, 0.0e+0 ) )
354 INTEGER INT_ONE
355 parameter( int_one = 1 )
356 INTEGER DESCMULT, BIGNUM
357 parameter(descmult = 100, bignum = descmult * descmult)
358 INTEGER BLOCK_CYCLIC_2D, CSRC_, CTXT_, DLEN_, DTYPE_,
359 $ LLD_, MB_, M_, NB_, N_, RSRC_
360 parameter( block_cyclic_2d = 1, dlen_ = 9, dtype_ = 1,
361 $ ctxt_ = 2, m_ = 3, n_ = 4, mb_ = 5, nb_ = 6,
362 $ rsrc_ = 7, csrc_ = 8, lld_ = 9 )
363
364
365 INTEGER COMM_PROC, CSRC, FIRST_PROC, I, ICTXT,
366 $ ICTXT_NEW, ICTXT_SAVE, IDUM3, JA_NEW, LAF_MIN,
367 $ LEVEL_DIST, LLDA, MAX_BW, MBW2, MYCOL, MYROW,
368 $ MY_NUM_COLS, NB, NEXT_TRI_SIZE_M,
369 $ NEXT_TRI_SIZE_N, NP, NPCOL, NPROW, NP_SAVE,
370 $ ODD_SIZE, OFST, PART_OFFSET, PART_SIZE,
371 $ PREV_TRI_SIZE_M, PREV_TRI_SIZE_N, RETURN_CODE,
372 $ STORE_N_A, UP_PREV_TRI_SIZE_M,
373 $ UP_PREV_TRI_SIZE_N, WORK_SIZE_MIN, WORK_U
374
375
376 INTEGER DESCA_1XP( 7 ), PARAM_CHECK( 9, 3 )
377
378
379 EXTERNAL blacs_get, blacs_gridexit, blacs_gridinfo,
380 $ caxpy, cgemm, cgerv2d, cgesd2d, clamov,
381 $
clatcpy, cpbtrf, cpotrf, csyrk, ctbtrs, ctrmm,
384
385
386 LOGICAL LSAME
387 INTEGER NUMROC
389
390
391 INTRINSIC ichar,
min, mod
392
393
394
395
396
397 info = 0
398
399
400
401
402 desca_1xp( 1 ) = 501
403
405
406 IF( return_code .NE. 0) THEN
407 info = -( 6*100 + 2 )
408 ENDIF
409
410
411
412 ictxt = desca_1xp( 2 )
413 csrc = desca_1xp( 5 )
414 nb = desca_1xp( 4 )
415 llda = desca_1xp( 6 )
416 store_n_a = desca_1xp( 3 )
417
418
419
420
421
422
423 max_bw =
max(bwl,bwu)
424 mbw2 = max_bw * max_bw
425
426 CALL blacs_gridinfo( ictxt, nprow, npcol, myrow, mycol )
427 np = nprow * npcol
428
429
430
431 IF( lwork .LT. -1) THEN
432 info = -10
433 ELSE IF ( lwork .EQ. -1 ) THEN
434 idum3 = -1
435 ELSE
436 idum3 = 1
437 ENDIF
438
439 IF( n .LT. 0 ) THEN
440 info = -1
441 ENDIF
442
443 IF( n+ja-1 .GT. store_n_a ) THEN
444 info = -( 6*100 + 6 )
445 ENDIF
446
447 IF(( bwl .GT. n-1 ) .OR.
448 $ ( bwl .LT. 0 ) ) THEN
449 info = -2
450 ENDIF
451
452 IF(( bwu .GT. n-1 ) .OR.
453 $ ( bwu .LT. 0 ) ) THEN
454 info = -3
455 ENDIF
456
457 IF( llda .LT. (bwl+bwu+1) ) THEN
458 info = -( 6*100 + 6 )
459 ENDIF
460
461 IF( nb .LE. 0 ) THEN
462 info = -( 6*100 + 4 )
463 ENDIF
464
465
466
467 IF( nprow .NE. 1 ) THEN
468 info = -( 6*100+2 )
469 ENDIF
470
471 IF( n .GT. np*nb-mod( ja-1, nb )) THEN
472 info = -( 1 )
474 $ 'PCDBTRF, D&C alg.: only 1 block per proc',
475 $ -info )
476 RETURN
477 ENDIF
478
479 IF((ja+n-1.GT.nb) .AND. ( nb.LT.2*
max(bwl,bwu) ))
THEN
480 info = -( 6*100+4 )
482 $ 'PCDBTRF, D&C alg.: NB too small',
483 $ -info )
484 RETURN
485 ENDIF
486
487
488
489
490 laf_min = nb*(bwl+bwu)+6*
max(bwl,bwu)*
max(bwl,bwu)
491
492 IF( laf .LT. laf_min ) THEN
493 info = -8
494
495 af( 1 ) = laf_min
497 $ 'PCDBTRF: auxiliary storage error ',
498 $ -info )
499 RETURN
500 ENDIF
501
502
503
504 work_size_min =
max(bwl,bwu)*
max(bwl,bwu)
505
506 work( 1 ) = work_size_min
507
508 IF( lwork .LT. work_size_min ) THEN
509 IF( lwork .NE. -1 ) THEN
510 info = -10
512 $ 'PCDBTRF: worksize error ',
513 $ -info )
514 ENDIF
515 RETURN
516 ENDIF
517
518
519
520 param_check( 9, 1 ) = desca(5)
521 param_check( 8, 1 ) = desca(4)
522 param_check( 7, 1 ) = desca(3)
523 param_check( 6, 1 ) = desca(1)
524 param_check( 5, 1 ) = ja
525 param_check( 4, 1 ) = bwu
526 param_check( 3, 1 ) = bwl
527 param_check( 2, 1 ) = n
528 param_check( 1, 1 ) = idum3
529
530 param_check( 9, 2 ) = 605
531 param_check( 8, 2 ) = 604
532 param_check( 7, 2 ) = 603
533 param_check( 6, 2 ) = 601
534 param_check( 5, 2 ) = 5
535 param_check( 4, 2 ) = 3
536 param_check( 3, 2 ) = 2
537 param_check( 2, 2 ) = 1
538 param_check( 1, 2 ) = 10
539
540
541
542
543
544 IF( info.GE.0 ) THEN
545 info = bignum
546 ELSE IF( info.LT.-descmult ) THEN
547 info = -info
548 ELSE
549 info = -info * descmult
550 END IF
551
552
553
554 CALL globchk( ictxt, 9, param_check, 9,
555 $ param_check( 1, 3 ), info )
556
557
558
559
560 IF( info.EQ.bignum ) THEN
561 info = 0
562 ELSE IF( mod( info, descmult ) .EQ. 0 ) THEN
563 info = -info / descmult
564 ELSE
565 info = -info
566 END IF
567
568 IF( info.LT.0 ) THEN
569 CALL pxerbla( ictxt,
'PCDBTRF', -info )
570 RETURN
571 END IF
572
573
574
575 IF( n.EQ.0 )
576 $ RETURN
577
578
579
580
581
582 part_offset = nb*( (ja-1)/(npcol*nb) )
583
584 IF ( (mycol-csrc) .LT. (ja-part_offset-1)/nb ) THEN
585 part_offset = part_offset + nb
586 ENDIF
587
588 IF ( mycol .LT. csrc ) THEN
589 part_offset = part_offset - nb
590 ENDIF
591
592
593
594
595
596
597
598 first_proc = mod( ( ja-1 )/nb+csrc, npcol )
599
600
601
602 ja_new = mod( ja-1, nb ) + 1
603
604
605
606 np_save = np
607 np = ( ja_new+n-2 )/nb + 1
608
609
610
611 CALL reshape( ictxt, int_one, ictxt_new, int_one,
612 $ first_proc, int_one, np )
613
614
615
616 ictxt_save = ictxt
617 ictxt = ictxt_new
618 desca_1xp( 2 ) = ictxt_new
619
620
621
622 CALL blacs_gridinfo( ictxt, nprow, npcol, myrow, mycol )
623
624
625
626 IF( myrow .LT. 0 ) THEN
627 GOTO 1234
628 ENDIF
629
630
631
632
633
634
635 part_size = nb
636
637
638
639 my_num_cols =
numroc( n, part_size, mycol, 0, npcol )
640
641
642
643 IF ( mycol .EQ. 0 ) THEN
644 part_offset = part_offset+mod( ja_new-1, part_size )
645 my_num_cols = my_num_cols - mod(ja_new-1, part_size )
646 ENDIF
647
648
649
650 ofst = part_offset*llda
651
652
653
654 odd_size = my_num_cols
655 IF ( mycol .LT. np-1 ) THEN
656 odd_size = odd_size - max_bw
657 ENDIF
658
659
660
661 work_u = bwu*odd_size + 3*mbw2
662
663
664
665
666 DO 10 i=1, laf_min
667 af( i ) = czero
668 10 CONTINUE
669
670
671
672 DO 20 i=1, work_size_min
673 work( i ) = czero
674 20 CONTINUE
675
676
677
678
679
680
681
682
683
684
685
686 IF( mycol .GT. 0 ) THEN
687 prev_tri_size_m=
min( bwl,
688 $
numroc( n, part_size, mycol, 0, npcol ) )
689 prev_tri_size_n=
min( bwl,
690 $
numroc( n, part_size, mycol-1, 0, npcol ) )
691 ENDIF
692
693 IF( mycol .GT. 0 ) THEN
694 up_prev_tri_size_m=
min( bwu,
695 $
numroc( n, part_size, mycol, 0, npcol ) )
696 up_prev_tri_size_n=
min( bwu,
697 $
numroc( n, part_size, mycol-1, 0, npcol ) )
698 ENDIF
699
700 IF( mycol .LT. npcol-1 ) THEN
701 next_tri_size_m=
min( bwl,
702 $
numroc( n, part_size, mycol+1, 0, npcol ) )
703 next_tri_size_n=
min( bwl,
704 $
numroc( n, part_size, mycol, 0, npcol ) )
705 ENDIF
706
707 IF ( mycol .LT. np-1 ) THEN
708
709
710
711
712
713 CALL ctrsd2d( ictxt, 'U', 'N', next_tri_size_m,
714 $ next_tri_size_n,
715 $ a( ofst+(my_num_cols-bwl)*llda+(bwl+bwu+1) ),
716 $ llda-1, 0, mycol+1 )
717
718 ENDIF
719
720
721
722
723 CALL cdbtrf( odd_size, odd_size, bwl, bwu, a( ofst + 1),
724 $ llda, info )
725
726 IF( info.NE.0 ) THEN
727 info = mycol+1
728 GOTO 1500
729 ENDIF
730
731
732 IF ( mycol .LT. np-1 ) THEN
733
734
735
736
737
738
740 $ a(( ofst+(bwl+bwu+1)+(odd_size-bwl)*llda )),
741 $ llda-1, af( odd_size*bwu+2*mbw2+1+max_bw-bwl ),
742 $ max_bw )
743 CALL clamov( 'L', bwu, bwu, a( ( ofst+1+odd_size*llda ) ),
744 $ llda-1,
745 $ af( work_u+odd_size*bwl+2*mbw2+1+max_bw-bwu ),
746 $ max_bw )
747
748
749
750 CALL ctbtrs( 'L', 'N', 'U', bwu, bwl, bwu,
751 $ a( ofst+bwu+1+(odd_size-bwu )*llda ), llda,
752 $ af( work_u+odd_size*bwl+2*mbw2+1+max_bw-bwu ),
753 $ max_bw, info )
754
755
756
757 CALL ctbtrs( 'U', 'C', 'N', bwl, bwu, bwl,
758 $ a( ofst+1+(odd_size-bwl)*llda ), llda,
759 $ af( odd_size*bwu+2*mbw2+1+max_bw-bwl ), max_bw,
760 $ info )
761
762
763
764
766 $ af( odd_size*bwu+2*mbw2+1+max_bw-bwl ), max_bw,
767 $ a(( ofst+(bwl+bwu+1)+(odd_size-bwl)*llda )),
768 $ llda-1 )
769
770
771
772 CALL clamov( 'L', bwu, bwu,
773 $ af( work_u+odd_size*bwl+2*mbw2+1+max_bw-bwu ),
774 $ max_bw, a(( ofst+1+odd_size*llda )), llda-1 )
775
776
777
778
779
780
781
782
783
784 CALL cgemm( 'C', 'N', max_bw, max_bw, max_bw, -cone ,
785 $ af( odd_size*bwu+2*mbw2+1), max_bw,
786 $ af( work_u+odd_size*bwl+2*mbw2+1), max_bw, cone,
787 $ a( ofst+odd_size*llda+1+bwu ), llda-1 )
788
789 ENDIF
790
791
792
793 1500 CONTINUE
794
795
796 IF ( mycol .NE. 0 ) THEN
797
798
799
800
801
802
803
804
805
806 CALL ctrrv2d( ictxt, 'U', 'N', prev_tri_size_m,
807 $ prev_tri_size_n, af( work_u+1 ), odd_size, 0,
808 $ mycol-1 )
809
810 IF (info.EQ.0) THEN
811
812
813
814 CALL ctbtrs( 'L', 'N', 'U', odd_size, bwl, bwl,
815 $ a( ofst + bwu+1 ), llda, af( work_u+1 ),
816 $ odd_size, info )
817
818
819
820
821
822
823
824 CALL clatcpy(
'L', up_prev_tri_size_n, up_prev_tri_size_m,
825 $ a( ofst+1 ), llda-1, af( 1 ), odd_size )
826
827 CALL ctbtrs( 'U', 'C', 'N', odd_size, bwu, bwu,
828 $ a( ofst + 1 ), llda,
829 $ af( 1 ), odd_size, info )
830
831
832
833
834
835
836
837 DO 30 i=1, mbw2
838 af( odd_size*bwu+2*mbw2+i ) = czero
839 30 CONTINUE
840
841 CALL cgemm( 'C', 'N', bwu, bwl, odd_size,
842 $ -cone, af( 1 ), odd_size,
843 $ af( work_u+1 ), odd_size, czero,
844 $ af( 1+
max(0,bwl-bwu)+odd_size*bwu+
845 $ (2*max_bw+
max(0,bwu-bwl))*max_bw),
846 $ max_bw )
847
848
849
850
851
852 CALL cgesd2d( ictxt, max_bw, max_bw,
853 $ af( odd_size*bwu+2*mbw2+1 ), max_bw, 0,
854 $ mycol-1 )
855
856
857 IF ( mycol .LT. np-1 ) THEN
858
859
860
861
862
863
864
865
866
867
869 $ af( work_u+odd_size-bwl+1 ), odd_size,
870 $ af( (odd_size)*bwu+1+(max_bw-bwl) ),
871 $ max_bw )
872
873 CALL ctrmm( 'R', 'U', 'C', 'N', bwl, bwl, -cone,
874 $ a( ( ofst+(bwl+bwu+1)+(odd_size-bwl)*llda ) ),
875 $ llda-1, af( (odd_size)*bwu+1+(max_bw-bwl) ),
876 $ max_bw )
877
878
879
880
881
882
883
885 $ af( odd_size-bwu+1 ), odd_size,
886 $ af( work_u+(odd_size)*bwl+1+max_bw-bwu ),
887 $ max_bw )
888
889 CALL ctrmm( 'R', 'L', 'N', 'N', bwu, bwu, -cone,
890 $ a( ( ofst+1+odd_size*llda ) ), llda-1,
891 $ af( work_u+(odd_size)*bwl+1+max_bw-bwu ),
892 $ max_bw )
893
894 ENDIF
895
896 ENDIF
897
898
899 ENDIF
900
901
902
903
904
905 CALL igamx2d( ictxt, 'A', ' ', 1, 1, info, 1, info, info,
906 $ -1, 0, 0 )
907
908 IF( mycol.EQ.0 ) THEN
909 CALL igebs2d( ictxt, 'A', ' ', 1, 1, info, 1 )
910 ELSE
911 CALL igebr2d( ictxt, 'A', ' ', 1, 1, info, 1, 0, 0 )
912 ENDIF
913
914 IF ( info.NE.0 ) THEN
915 GOTO 1000
916 ENDIF
917
918
919
920
921
922
923
924
925
926
927
928
929 IF( mycol .EQ. npcol-1 ) THEN
930 GOTO 14
931 ENDIF
932
933
934
935
936
937 IF( (mod( mycol+1, 2 ) .EQ. 0) .AND. ( mycol .GT. 0 ) ) THEN
938
939 CALL cgesd2d( ictxt, max_bw, max_bw,
940 $ af( odd_size*bwu+1 ),
941 $ max_bw, 0, mycol-1 )
942
943 CALL cgesd2d( ictxt, max_bw, max_bw,
944 $ af( work_u+odd_size*bwl+1 ),
945 $ max_bw, 0, mycol-1 )
946
947 ENDIF
948
949
950
951
952 CALL clamov( 'N', max_bw, max_bw,
953 $ a( ofst+odd_size*llda+bwu+1 ),
954 $ llda-1, af( odd_size*bwu+mbw2+1 ),
955 $ max_bw )
956
957
958
959 IF( mycol.LT. npcol-1 ) THEN
960
961 CALL cgerv2d( ictxt, max_bw, max_bw,
962 $ af( odd_size*bwu+2*mbw2+1 ),
963 $ max_bw, 0,
964 $ mycol+1 )
965
966
967
968 CALL caxpy( mbw2, cone,
969 $ af( odd_size*bwu+2*mbw2+1 ),
970 $ 1, af( odd_size*bwu+mbw2+1 ), 1 )
971
972 ENDIF
973
974
975
976
977
978
979
980 level_dist = 1
981
982
983
984 12 CONTINUE
985 IF( mod( (mycol+1)/level_dist, 2) .NE. 0 ) GOTO 11
986
987
988
989 IF( mycol-level_dist .GE. 0 ) THEN
990 CALL cgerv2d( ictxt, max_bw, max_bw, work( 1 ),
991 $ max_bw, 0, mycol-level_dist )
992
993 CALL caxpy( mbw2, cone, work( 1 ), 1,
994 $ af( odd_size*bwu+mbw2+1 ), 1 )
995
996 ENDIF
997
998
999
1000 IF( mycol+level_dist .LT. npcol-1 ) THEN
1001 CALL cgerv2d( ictxt, max_bw, max_bw, work( 1 ),
1002 $ max_bw, 0, mycol+level_dist )
1003
1004 CALL caxpy( mbw2, cone, work( 1 ), 1,
1005 $ af( odd_size*bwu+mbw2+1 ), 1 )
1006
1007 ENDIF
1008
1009 level_dist = level_dist*2
1010
1011 GOTO 12
1012 11 CONTINUE
1013
1014
1015
1016
1017
1018
1019
1020
1021 CALL cdbtrf( max_bw, max_bw,
min( max_bw-1, bwl ),
1022 $
min( max_bw-1, bwu ), af( odd_size*bwu+mbw2+1
1023 $ -(
min( max_bw-1, bwu ))), max_bw+1, info )
1024
1025 IF( info.NE.0 ) THEN
1026 info = npcol + mycol
1027 ENDIF
1028
1029
1030
1031
1032
1033
1034 IF( level_dist .EQ. 1 )THEN
1035 comm_proc = mycol + 1
1036
1037
1038
1039
1040 CALL clamov( 'N', max_bw, max_bw, af( odd_size*bwu+1 ),
1041 $ max_bw, af( work_u+odd_size*bwl+2*mbw2+1 ),
1042 $ max_bw )
1043
1044 CALL clamov( 'N', max_bw, max_bw, af( work_u+odd_size*bwl+1 ),
1045 $ max_bw, af( odd_size*bwu+2*mbw2+1 ), max_bw )
1046
1047 ELSE
1048 comm_proc = mycol + level_dist/2
1049 ENDIF
1050
1051 IF( mycol/level_dist .LE. (npcol-1)/level_dist-2 )THEN
1052
1053 CALL cgerv2d( ictxt, max_bw, max_bw,
1054 $ af( odd_size*bwu+1 ),
1055 $ max_bw, 0, comm_proc )
1056
1057 CALL cgerv2d( ictxt, max_bw, max_bw,
1058 $ af( work_u+odd_size*bwl+1 ),
1059 $ max_bw, 0, comm_proc )
1060
1061 IF( info .EQ. 0 ) THEN
1062
1063
1064
1065
1066
1067 CALL ctbtrs(
1068 $
'L',
'N',
'U', bwu,
min( bwl, bwu-1 ), bwu,
1069 $ af( odd_size*bwu+
1070 $ mbw2+1+(max_bw+1)*(max_bw-bwu)), max_bw+1,
1071 $ af( work_u+odd_size*bwl+1+max_bw-bwu), max_bw, info )
1072
1073
1074
1075
1076 CALL ctbtrs(
1077 $
'U',
'C',
'N', bwl,
min( bwu, bwl-1 ), bwl,
1078 $ af( odd_size*bwu+
1079 $ mbw2+1-
min( bwu, bwl-1 )+(max_bw+1)*(max_bw-bwl)), max_bw+1,
1080 $ af( odd_size*bwu+1+max_bw-bwl), max_bw, info )
1081
1082 ENDIF
1083
1084
1085
1086
1087 CALL cgemm( 'C', 'N', max_bw, max_bw, max_bw, -cone,
1088 $ af( (odd_size)*bwu+1 ), max_bw,
1089 $ af( work_u+(odd_size)*bwl+1 ), max_bw, czero,
1090 $ work( 1 ), max_bw )
1091
1092
1093
1094 CALL cgesd2d( ictxt, max_bw, max_bw, work( 1 ), max_bw,
1095 $ 0, mycol+level_dist )
1096
1097 ENDIF
1098
1099
1100
1101
1102
1103
1104
1105 IF( (mycol/level_dist .GT. 0 ).AND.
1106 $ ( mycol/level_dist .LE. (npcol-1)/level_dist-1 ) ) THEN
1107
1108 IF( level_dist .GT. 1)THEN
1109
1110
1111
1112
1113 CALL cgerv2d( ictxt, max_bw, max_bw,
1114 $ af( work_u+odd_size*bwl+2*mbw2+1 ),
1115 $ max_bw, 0, mycol-level_dist/2 )
1116
1117
1118
1119
1120 CALL cgerv2d( ictxt, max_bw, max_bw,
1121 $ af( odd_size*bwu+2*mbw2+1 ),
1122 $ max_bw, 0, mycol-level_dist/2 )
1123
1124 ENDIF
1125
1126
1127 IF( info.EQ.0 ) THEN
1128
1129
1130
1131
1132
1133
1134 CALL clatcpy(
'N', max_bw, max_bw, af( work_u+odd_size*bwl+
1135 $ 2*mbw2+1), max_bw, work( 1 ), max_bw )
1136
1137 CALL ctbtrs(
1138 $
'L',
'N',
'U', max_bw,
min( bwl, max_bw-1 ), bwl,
1139 $ af( odd_size*bwu+mbw2+1), max_bw+1,
1140 $ work( 1+max_bw*(max_bw-bwl) ), max_bw, info )
1141
1142
1143
1145 $ 'N', max_bw, max_bw, work( 1 ), max_bw,
1146 $ af( work_u+odd_size*bwl+
1147 $ 2*mbw2+1), max_bw )
1148
1149
1150
1151
1152
1153 CALL clatcpy(
'N', max_bw, max_bw, af( odd_size*bwu+
1154 $ 2*mbw2+1), max_bw, work( 1 ), max_bw )
1155
1156 CALL ctbtrs(
1157 $
'U',
'C',
'N', max_bw,
min( bwu, max_bw-1 ), bwu,
1158 $ af( odd_size*bwu+mbw2+1-
min( bwu, max_bw-1 )), max_bw+1,
1159 $ work( 1+max_bw*(max_bw-bwu) ), max_bw, info )
1160
1161
1162
1164 $ 'N', max_bw, max_bw, work( 1 ), max_bw,
1165 $ af( odd_size*bwu+
1166 $ 2*mbw2+1), max_bw )
1167
1168
1169 ENDIF
1170
1171
1172
1173
1174
1175 CALL cgemm( 'N', 'C', max_bw, max_bw, max_bw, -cone,
1176 $ af( (odd_size)*bwu+2*mbw2+1 ), max_bw,
1177 $ af( work_u+(odd_size)*bwl+2*mbw2+1 ), max_bw,
1178 $ czero, work( 1 ), max_bw )
1179
1180
1181
1182 CALL cgesd2d( ictxt, max_bw, max_bw, work( 1 ), max_bw,
1183 $ 0, mycol-level_dist )
1184
1185
1186
1187 IF( mycol/level_dist .LE. (npcol-1)/level_dist-2 ) THEN
1188
1189
1190
1191 IF( ( mod( mycol/( 2*level_dist ),2 )) .EQ.0 ) THEN
1192 comm_proc = mycol + level_dist
1193 ELSE
1194 comm_proc = mycol - level_dist
1195 ENDIF
1196
1197
1198
1199
1200
1201 CALL cgemm( 'N', 'N', max_bw, max_bw, max_bw, -cone,
1202 $ af( work_u+odd_size*bwl+2*mbw2+1 ), max_bw,
1203 $ af( odd_size*bwu+1 ), max_bw, czero,
1204 $ work( 1 ), max_bw )
1205
1206
1207
1208 CALL cgesd2d( ictxt, max_bw, max_bw, work( 1 ), max_bw,
1209 $ 0, comm_proc )
1210
1211 CALL cgemm( 'N', 'N', max_bw, max_bw, max_bw, -cone,
1212 $ af( odd_size*bwu+2*mbw2+1 ), max_bw,
1213 $ af( work_u+odd_size*bwl+1 ), max_bw, czero,
1214 $ work( 1 ), max_bw )
1215
1216
1217
1218 CALL cgesd2d( ictxt, max_bw, max_bw, work( 1 ), max_bw,
1219 $ 0, comm_proc )
1220
1221 ENDIF
1222
1223 ENDIF
1224
1225
1226 14 CONTINUE
1227
1228
1229 1000 CONTINUE
1230
1231
1232
1233
1234 IF( ictxt_save .NE. ictxt_new ) THEN
1235 CALL blacs_gridexit( ictxt_new )
1236 ENDIF
1237
1238 1234 CONTINUE
1239
1240
1241
1242 ictxt = ictxt_save
1243 np = np_save
1244
1245
1246
1247 work( 1 ) = work_size_min
1248
1249
1250
1251 CALL igamx2d( ictxt, 'A', ' ', 1, 1, info, 1, info, info,
1252 $ -1, 0, 0 )
1253
1254 IF( mycol.EQ.0 ) THEN
1255 CALL igebs2d( ictxt, 'A', ' ', 1, 1, info, 1 )
1256 ELSE
1257 CALL igebr2d( ictxt, 'A', ' ', 1, 1, info, 1, 0, 0 )
1258 ENDIF
1259
1260
1261 RETURN
1262
1263
1264
subroutine cdbtrf(m, n, kl, ku, ab, ldab, info)
subroutine clatcpy(uplo, m, n, a, lda, b, ldb)
subroutine desc_convert(desc_in, desc_out, info)
integer function numroc(n, nb, iproc, isrcproc, nprocs)
subroutine globchk(ictxt, n, x, ldx, iwork, info)
subroutine pxerbla(ictxt, srname, info)
void reshape(Int *context_in, Int *major_in, Int *context_out, Int *major_out, Int *first_proc, Int *nprow_new, Int *npcol_new)