25 integer(kind=kint) :: N
26 real(kind=
kreal),
pointer :: d(:) => null()
27 real(kind=
kreal),
pointer :: al(:) => null()
28 real(kind=
kreal),
pointer :: au(:) => null()
29 integer(kind=kint),
pointer :: indexL(:) => null()
30 integer(kind=kint),
pointer :: indexU(:) => null()
31 integer(kind=kint),
pointer :: itemL(:) => null()
32 integer(kind=kint),
pointer :: itemU(:) => null()
33 real(kind=
kreal),
pointer :: alu(:) => null()
35 integer(kind=kint) :: NColor
36 integer(kind=kint),
pointer :: COLORindex(:) => null()
37 integer(kind=kint),
pointer :: perm(:) => null()
38 integer(kind=kint),
pointer :: iperm(:) => null()
40 logical,
save :: isFirst = .true.
42 logical,
save :: INITIALIZED = .false.
49 integer(kind=kint ) :: npl, npu, npcl, npcu
50 real (kind=
kreal),
allocatable :: cd(:)
51 integer(kind=kint ) :: ncolor_in
52 real (kind=
kreal) :: sigma_diag
53 real (kind=
kreal) :: alutmp(1,1), pw(1)
54 integer(kind=kint ) :: ii, i, j, k
55 integer(kind=kint ) :: nthreads = 1
56 integer(kind=kint ),
allocatable :: perm_tmp(:)
63 if (hecmat%Iarray(98) == 1)
then
65 else if (hecmat%Iarray(97) == 1)
then
79 if (nthreads == 1)
then
81 allocate(colorindex(0:1), perm(n), iperm(n))
89 allocate(colorindex(0:n), perm_tmp(n), perm(n), iperm(n))
91 hecmat%indexU, hecmat%itemU, perm_tmp, iperm)
94 hecmat%indexU, hecmat%itemU, perm_tmp, &
95 ncolor_in, ncolor, colorindex, perm, iperm)
102 npl = hecmat%indexL(n)
103 npu = hecmat%indexU(n)
104 allocate(indexl(0:n), indexu(0:n), iteml(npl), itemu(npu))
106 hecmat%indexL, hecmat%indexU, hecmat%itemL, hecmat%itemU, &
107 indexl, indexu, iteml, itemu)
112 allocate(d(n), al(npl), au(npu))
114 hecmat%indexL, hecmat%indexU, hecmat%itemL, hecmat%itemU, &
115 hecmat%AL, hecmat%AU, hecmat%D, &
116 indexl, indexu, iteml, itemu, al, au, d)
132 alutmp(1,1)= alu(ii) * sigma_diag
133 alutmp(1,1)= 1.d0/alutmp(1,1)
142 hecmat%Iarray(98) = 0
143 hecmat%Iarray(97) = 0
152 real(kind=
kreal),
intent(inout) :: zp(:)
153 integer(kind=kint) :: ic, i, iold, j, isl, iel, isu, ieu, k
154 real(kind=
kreal) :: sw(1), x(1)
157 integer(kind=kint),
parameter :: numofblockperthread = 100
158 integer(kind=kint),
save :: numofthread = 1, numofblock
159 integer(kind=kint),
save,
allocatable :: ictoblockindex(:)
160 integer(kind=kint),
save,
allocatable :: blockindextocolorindex(:)
161 integer(kind=kint),
save :: sectorcachesize0, sectorcachesize1
162 integer(kind=kint) :: blockindex, elementcount, numofelement, ii
163 real(kind=
kreal) :: numofelementperblock
164 integer(kind=kint) :: my_rank
168 numofblock = numofthread * numofblockperthread
169 if (
allocated(ictoblockindex))
deallocate(ictoblockindex)
170 if (
allocated(blockindextocolorindex))
deallocate(blockindextocolorindex)
171 allocate (ictoblockindex(0:ncolor), &
172 blockindextocolorindex(0:numofblock + ncolor))
173 numofelement = n + indexl(n) + indexu(n)
174 numofelementperblock = dble(numofelement) / numofblock
177 ictoblockindex(0) = 0
178 blockindextocolorindex = -1
179 blockindextocolorindex(0) = 0
188 do i = colorindex(ic-1)+1, colorindex(ic)
189 elementcount = elementcount + 1
190 elementcount = elementcount + (indexl(i) - indexl(i-1))
191 elementcount = elementcount + (indexu(i) - indexu(i-1))
192 if (elementcount > ii * numofelementperblock &
193 .or. i == colorindex(ic))
then
195 blockindex = blockindex + 1
196 blockindextocolorindex(blockindex) = i
201 ictoblockindex(ic) = blockindex
203 numofblock = blockindex
206 sectorcachesize0, sectorcachesize1 )
225 do blockindex = ictoblockindex(ic-1)+1, ictoblockindex(ic)
226 do i = blockindextocolorindex(blockindex-1)+1, &
227 blockindextocolorindex(blockindex)
235 sw(1)= sw(1) - al(j)*x(1)
249 do blockindex = ictoblockindex(ic), ictoblockindex(ic-1)+1, -1
250 do i = blockindextocolorindex(blockindex), &
251 blockindextocolorindex(blockindex-1)+1, -1
262 sw(1)= sw(1) + au(j)*x(1)
269 zp(iold)= zp(iold) - x(1)
286 integer(kind=kint ) :: nthreads = 1
288 if (
associated(colorindex))
deallocate(colorindex)
289 if (
associated(perm))
deallocate(perm)
290 if (
associated(iperm))
deallocate(iperm)
291 if (
associated(alu))
deallocate(alu)
292 if (nthreads >= 1)
then
293 if (
associated(d))
deallocate(d)
294 if (
associated(al))
deallocate(al)
295 if (
associated(au))
deallocate(au)
296 if (
associated(indexl))
deallocate(indexl)
297 if (
associated(indexu))
deallocate(indexu)
298 if (
associated(iteml))
deallocate(iteml)
299 if (
associated(itemu))
deallocate(itemu)
312 initialized = .false.
315 subroutine write_debug_info
317 integer(kind=kint) :: my_rank, ic, in
320 if (my_rank.eq.0)
then
321 write(*,*)
'DEBUG: Output fort.19000+myrank and fort.29000+myrank for coloring information'
323 write(19000+my_rank,
'(a)')
'#NCOLORTot'
324 write(19000+my_rank,*) ncolor
325 write(19000+my_rank,
'(a)')
'#ic COLORindex(ic-1)+1 COLORindex(ic)'
327 write(19000+my_rank,*) ic, colorindex(ic-1)+1,colorindex(ic)
329 write(29000+my_rank,
'(a)')
'#n_node'
330 write(29000+my_rank,*) n
331 write(29000+my_rank,
'(a)')
'#in OLDtoNEW(in) NEWtoOLD(in)'
333 write(29000+my_rank,*) in, iperm(in), perm(in)
334 if (perm(iperm(in)) .ne. in)
then
335 write(29000+my_rank,*)
'** WARNING **: NEWtoOLD and OLDtoNEW: ',in
338 end subroutine write_debug_info
340 subroutine check_ordering
342 integer(kind=kint) :: ic, i, j, k
343 integer(kind=kint),
allocatable :: iicolor(:)
345 if (ncolor.gt.1)
then
348 do i= colorindex(ic-1)+1, colorindex(ic)
354 do i= colorindex(ic-1)+1, colorindex(ic)
355 do j= indexl(i-1)+1, indexl(i)
357 if (iicolor(i).eq.iicolor(k))
then
358 write(*,*) .eq.
'** ERROR **: L-part: iicolor(i)iicolor(k)',i,k,iicolor(i)
365 do i= colorindex(ic), colorindex(ic-1)+1, -1
366 do j= indexu(i-1)+1, indexu(i)
368 if (iicolor(i).eq.iicolor(k))
then
369 write(*,*) .eq.
'** ERROR **: U-part: iicolor(i)iicolor(k)',i,k,iicolor(i)
377 end subroutine check_ordering