xref: /phasta/svLS/LHS.f (revision 712d3df0b59ebebaaeaea358162c8d2c043c6e08)
1*1e99f302SBen Matthews!     This software is Copyright (c) 2012-2015 The Regents of the
2*1e99f302SBen Matthews!     University of California. All Rights Reserved.
3*1e99f302SBen Matthews!
4*1e99f302SBen Matthews!     Permission to copy and modify this software and its documentation
5*1e99f302SBen Matthews!     for educational, research and non-profit purposes, without fee,
6*1e99f302SBen Matthews!     and without a written agreement is hereby granted, provided that
7*1e99f302SBen Matthews!     the above copyright notice, this paragraph and the following three
8*1e99f302SBen Matthews!     paragraphs appear in all copies.
9*1e99f302SBen Matthews!
10*1e99f302SBen Matthews!     Permission to make commercial use of this software may be obtained
11*1e99f302SBen Matthews!     by contacting:
12*1e99f302SBen Matthews!
13*1e99f302SBen Matthews!     Technology Transfer Office
14*1e99f302SBen Matthews!     9500 Gilman Drive, Mail Code 0910
15*1e99f302SBen Matthews!     University of California
16*1e99f302SBen Matthews!     La Jolla, CA 92093-0910
17*1e99f302SBen Matthews!     (858) 534-5815
18*1e99f302SBen Matthews!     invent@ucsd.edu
19*1e99f302SBen Matthews!
20*1e99f302SBen Matthews!     This software program and documentation are copyrighted by The
21*1e99f302SBen Matthews!     Regents of the University of California. The software program and
22*1e99f302SBen Matthews!     documentation are supplied "as is", without any accompanying
23*1e99f302SBen Matthews!     services from The Regents. The Regents does not warrant that the
24*1e99f302SBen Matthews!     operation of the program will be uninterrupted or error-free. The
25*1e99f302SBen Matthews!     end-user understands that the program was developed for research
26*1e99f302SBen Matthews!     purposes and is advised not to rely exclusively on the program for
27*1e99f302SBen Matthews!     any reason.
28*1e99f302SBen Matthews!
29*1e99f302SBen Matthews!     IN NO EVENT SHALL THE UNIVERSITY OF CALIFORNIA BE LIABLE TO ANY
30*1e99f302SBen Matthews!     PARTY FOR DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL
31*1e99f302SBen Matthews!     DAMAGES, INCLUDING LOST PROFITS, ARISING OUT OF THE USE OF THIS
32*1e99f302SBen Matthews!     SOFTWARE AND ITS DOCUMENTATION, EVEN IF THE UNIVERSITY OF
33*1e99f302SBen Matthews!     CALIFORNIA HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
34*1e99f302SBen Matthews!     THE UNIVERSITY OF CALIFORNIA SPECIFICALLY DISCLAIMS ANY
35*1e99f302SBen Matthews!     WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
36*1e99f302SBen Matthews!     OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. THE
37*1e99f302SBen Matthews!     SOFTWARE PROVIDED HEREUNDER IS ON AN "AS IS" BASIS, AND THE
38*1e99f302SBen Matthews!     UNIVERSITY OF CALIFORNIA HAS NO OBLIGATIONS TO PROVIDE
39*1e99f302SBen Matthews!     MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
40*1e99f302SBen Matthews
!     Fill an svLS left-hand-side structure (lhs) from a sparse matrix
!     pattern given in compressed-row form.
!
!     Arguments
!       lhs    : structure to fill; its colPtr, rowPtr, diagPtr, map,
!                cS and face components are allocated here
!       commu  : communicator description; nTasks, comm and tF are
!                read. tF is used as this task's 1-based index (peers
!                are addressed as MPI rank i-1)
!       gnNo   : size of the global-to-local lookup table (global
!                node ids index an array of this length)
!       nNo    : number of local nodes (rows)
!       nnz    : number of stored entries in colPtr
!       gNodes : gNodes(a) is the global id of local node a; 0 is
!                used internally as padding, so ids must be nonzero
!       rowPtr : row a occupies colPtr(rowPtr(a) : rowPtr(a+1)-1)
!       colPtr : local column index of every stored entry
!       nFaces : number of face slots to allocate in lhs%face
!
!     With a single task the pattern is copied unchanged and lhs%map
!     is the identity. Otherwise the local nodes are renumbered
!     (lhs%map(a) is the new index of old local node a), the pattern
!     is permuted accordingly, and the per-peer tables in lhs%cS are
!     built, including the contiguous-block description (nBl, blPtr,
!     blN) for peers with a lower task index.
      SUBROUTINE svLS_LHS_CREATE(lhs, commu, gnNo, nNo, nnz, gNodes,
     2   rowPtr, colPtr, nFaces)

      INCLUDE "svLS_STD.h"

      TYPE(svLS_lhsType), INTENT(INOUT) :: lhs
      TYPE(svLS_commuType), INTENT(IN) :: commu
      INTEGER, INTENT(IN) :: gnNo, nNo, nnz
      INTEGER, INTENT(IN) :: gNodes(nNo), rowPtr(nNo+1), colPtr(nnz)
      INTEGER, INTENT(IN) :: nFaces

      INTEGER i, j, k, a, Ac, ai, s, e, nTasks, tF, maxnNo, ierr,
     2   stat(MPI_STATUS_SIZE)

      INTEGER comm
      INTEGER, ALLOCATABLE :: aNodes(:,:), gtlPtr(:), ltg(:),
     2   part(:), sCount(:), disp(:)

!     NOTE(review): this only warns; execution continues into the
!     ALLOCATE below even when lhs is already flagged as created.
!     svLS_LHS_FREE stops in the mirrored situation - confirm whether
!     a STOP is intended here as well.
      IF (lhs%foC) THEN
         PRINT *, "LHS is not free"
         PRINT *, "You may use svLS_LHS_FREE to free this structure"
      END IF

      lhs%foC    = .TRUE.
      lhs%gnNo   = gnNo
      lhs%nNo    = nNo
      lhs%nnz    = nnz
      lhs%commu  = commu
      lhs%nFaces = nFaces

      nTasks = commu%nTasks
      comm   = commu%comm
      tF     = commu%tF

      ALLOCATE (lhs%colPtr(nnz), lhs%rowPtr(2,nNo), lhs%diagPtr(nNo),
     2   lhs%map(nNo), lhs%cS(nTasks), lhs%face(nFaces))

!     Single task: no renumbering, copy the pattern as it is
      IF (nTasks .EQ. 1) THEN
         DO i=1, nnz
            lhs%colPtr(i) = colPtr(i)
         END DO
         DO Ac=1, nNo
            s = rowPtr(Ac)
            e = rowPtr(Ac+1) - 1
!           Locate the diagonal entry of this row; diagPtr(Ac) is
!           left unset when the row stores no diagonal
            DO i=s, e
               a = colPtr(i)
               IF (Ac .EQ. a) THEN
                  lhs%diagPtr(Ac) = i
                  EXIT
               END IF
            END DO

!           rowPtr(1,:) / rowPtr(2,:) hold the first / last entry
            lhs%rowPtr(1,Ac) = s
            lhs%rowPtr(2,Ac) = e

            lhs%map(Ac) = Ac
         END DO

         lhs%mynNo = nNo
         RETURN
      END IF

!     Largest local node count over all tasks: common column length
!     for the gathered node lists
      CALL MPI_ALLREDUCE (nNo, maxnNo, 1, mpint, MPI_MAX, comm, ierr)

      ALLOCATE(aNodes(maxnNo,nTasks), part(maxnNo), sCount(nTasks),
     2   disp(nTasks), gtlPtr(gnNo), ltg(nNo))

!     Own global ids, zero-padded up to maxnNo
      part = 0
      part(1:nNo) = gNodes

      DO i=1, nTasks
         disp(i)   = (i-1)*maxnNo
         sCount(i) = maxnNo
      END DO

!     After the gather, aNodes(:,i) is the padded id list of task i
      CALL MPI_ALLGATHERV(part, maxnNo, mpint, aNodes, sCount, disp,
     2   mpint, comm, ierr)

!     gtlPtr(global id) = local index, 0 when the node is not local
      gtlPtr = 0
      DO a=1, nNo
         Ac = gNodes(a)
         gtlPtr(Ac) = a
      END DO

!     Walk the other tasks from the highest index down. An entry of
!     task i's column survives only if the node is also local here
!     and its slot in this task's own column (tF) is still nonzero;
!     when i > tF, keeping it also zeroes that own-column slot.
      DO i=nTasks, 1, -1
         IF (i .EQ. tF) CYCLE

         DO a=1, maxnNo
            Ac = aNodes(a,i)
!           First zero marks the start of the padding
            IF (Ac .EQ. 0) EXIT
            ai = gtlPtr(Ac)
            IF (ai .NE. 0) THEN
               IF (aNodes(ai,tF) .NE. 0) THEN
                  IF (i .GT. tF) aNodes(ai,tF) = 0
               ELSE
                  aNodes(a,i) = 0
               END IF
            ELSE
               aNodes(a,i) = 0
            END IF
         END DO
      END DO

!     Build ltg (new local position -> global id) task by task and
!     record, for every task i, how many entries its column retains
!     (cS(i)%n) and where they start (cS(i)%ptr)
      j = 1
      lhs%cS(1)%ptr = 1
      DO i=1, nTasks
         lhs%cS(i)%n = 0
         lhs%cS(i)%ptr = j
         IF (i.NE.tF .AND. i.NE.1)  THEN
            lhs%cS(i)%ptr = lhs%cS(i-1)%ptr + lhs%cS(i-1)%n
         END IF

         DO a=1, maxnNo
            Ac = aNodes(a,i)
            IF (Ac .NE. 0) THEN
               lhs%cS(i)%n = lhs%cS(i)%n + 1
               ai = gtlPtr(Ac)
!              Append the node to ltg unless its own-column slot was
!              already cleared while processing a task i <= tF
               IF (i.GT.tF .OR. aNodes(ai,tF).NE.0) THEN
                  ltg(j) = Ac
                  j = j + 1
                  aNodes(ai,tF) = 0
               END IF
            END IF
         END DO

!        tag = nTasks*min(i,tF) + max(i,tF): both ends of a pair
!        compute the same value. 0 marks "nothing to exchange".
         IF (i .LT. tF) THEN
            lhs%cS(i)%tag = nTasks*i  + tF
         ELSE
            lhs%cS(i)%tag = nTasks*tF + i
         END IF
         IF (lhs%cS(i)%n .EQ. 0) lhs%cS(i)%tag = 0
      END DO

      lhs%cS(tF)%tag = 0
      lhs%mynNo = lhs%cS(tF)%ptr + lhs%cS(tF)%n - 1

!     Rebuild gtlPtr for the new ordering and derive the old-local
!     to new-local permutation
      gtlPtr = 0
      DO a=1, nNo
         Ac = ltg(a)
         gtlPtr(Ac) = a
      END DO
      DO a=1, nNo
         Ac = gNodes(a)
         lhs%map(a) = gtlPtr(Ac)
      END DO

      DEALLOCATE(aNodes, part, gtlPtr, sCount, disp)

!     Permute the row extents; the entries themselves stay where
!     they are in colPtr, only the row that owns them is renamed
      DO a=1, nNo
         Ac = lhs%map(a)
         lhs%rowPtr(1,Ac) = rowPtr(a)
         lhs%rowPtr(2,Ac) = rowPtr(a+1) - 1
      END DO

!     Translate column indices to the new numbering
      DO i=1, nnz
         lhs%colPtr(i) = lhs%map(colPtr(i))
      END DO

!     Locate the diagonal entry of every (renumbered) row
      DO Ac=1, nNo
         DO i=lhs%rowPtr(1,Ac), lhs%rowPtr(2,Ac)
            a = lhs%colPtr(i)
            IF (Ac .EQ. a) THEN
               lhs%diagPtr(Ac) = i
               EXIT
            END IF
         END DO
      END DO

!     Receive buffer covering the ranges of all tasks below tF
      IF (tF .NE. 1) THEN
         i = tF - 1
         i = lhs%cS(i)%ptr + lhs%cS(i)%n - 1
         ALLOCATE(part(i))
      END IF

!     Exchange the ordered id lists: receive from tasks with a lower
!     index, send to tasks with a higher index
      DO i=1, nTasks
         lhs%cS(i)%nBl = 0
         IF (lhs%cS(i)%tag .NE. 0) THEN
            s = lhs%cS(i)%ptr
            e = s + lhs%cS(i)%n - 1
            IF (i .LT. tF) THEN
               CALL MPI_RECV(part(s:e), lhs%cS(i)%n, mpint, i-1,
     2            lhs%cS(i)%tag, comm, stat, ierr)

!              First pass: count the blocks. A block starts at the
!              first received id and whenever the id differs from
!              ltg(k), k being one past the previous position. The
!              inner search leaves k at the matching ltg position.
               k = 0
               DO j=s, e
                  k = k + 1
                  IF (part(j).NE.ltg(k) .OR. j.EQ.s) THEN
                     lhs%cS(i)%nBl = lhs%cS(i)%nBl + 1
                     DO k=1, lhs%cS(tF)%ptr
                        IF (part(j) .EQ. ltg(k)) EXIT
                     END DO
                  END IF
               END DO
               a = lhs%cS(i)%nBl
               ALLOCATE(lhs%cS(i)%blPtr(a), lhs%cS(i)%blN(a))

!              Second pass: same scan, now storing for each block
!              its starting ltg position (blPtr) and length (blN)
               k = 0
               a = 0
               DO j=s, e
                  k = k + 1
                  IF (part(j).NE.ltg(k) .OR. j.EQ.s) THEN
                     a = a + 1
                     lhs%cS(i)%blN(a) = 1
                     DO k=1, lhs%cS(tF)%ptr
                        IF (part(j) .EQ. ltg(k)) THEN
                           lhs%cS(i)%blPtr(a) = k
                           EXIT
                        END IF
                     END DO
                  ELSE
                     lhs%cS(i)%blN(a) = lhs%cS(i)%blN(a) + 1
                  END IF
               END DO
            ELSE
!              MPI_SEND has no status argument: the list ends with
!              comm, ierr
               CALL MPI_SEND(ltg(s:e), lhs%cS(i)%n, mpint, i-1,
     2            lhs%cS(i)%tag, comm, ierr)
            END IF
         END IF
      END DO

      IF (ALLOCATED(part)) DEALLOCATE(part)
      DEALLOCATE(ltg)

      RETURN
      END SUBROUTINE svLS_LHS_CREATE
266*1e99f302SBen Matthews
267*1e99f302SBen Matthews!====================================================================
268*1e99f302SBen Matthews
!     Tear down an svLS left-hand-side structure: faces still flagged
!     as created are passed to svLS_BC_FREE, the per-task block
!     tables are released, the top-level arrays are deallocated and
!     the size fields are reset to zero.
!
!     lhs : structure to release. The program stops if lhs%foC is
!           false, i.e. the structure is not flagged as created.
      SUBROUTINE svLS_LHS_FREE(lhs)

      INCLUDE "svLS_STD.h"

      TYPE(svLS_lhsType), INTENT(INOUT) :: lhs

      INTEGER iFa, iTask

!     Nothing to free: report and terminate
      IF (.NOT.lhs%foC) THEN
         PRINT *, 'Cannot free LHS'
         PRINT *, 'It is not created yet'
         STOP
      END IF

!     Faces first, while lhs%nFaces and lhs%face are still valid
      DO iFa=1, lhs%nFaces
         IF (lhs%face(iFa)%foC) THEN
            CALL svLS_BC_FREE(lhs, iFa)
         END IF
      END DO

!     Block tables exist only for tasks that allocated them
      DO iTask=1, lhs%commu%nTasks
         IF (.NOT.ALLOCATED(lhs%cS(iTask)%blPtr)) CYCLE
         DEALLOCATE(lhs%cS(iTask)%blPtr, lhs%cS(iTask)%blN)
      END DO

      DEALLOCATE (lhs%colPtr, lhs%rowPtr, lhs%diagPtr, lhs%map, lhs%cS,
     2   lhs%face)

!     Mark the structure as free again
      lhs%nFaces = 0
      lhs%nnz    = 0
      lhs%nNo    = 0
      lhs%gnNo   = 0
      lhs%foC    = .FALSE.

      END SUBROUTINE svLS_LHS_FREE
304*1e99f302SBen Matthews
305*1e99f302SBen Matthews!====================================================================
306*1e99f302SBen Matthews
!     Pointer-returning variant of svLS_LHS_CREATE. The structure is
!     created in a local variable with the SAVE attribute and pLHS is
!     pointed at it, so every call works on the same single instance.
!     NOTE(review): the _C suffix suggests this serves a C interface
!     - confirm against the callers.
!
!     pLHS : on return, associated with the internally held structure
!     All remaining arguments are forwarded unchanged to
!     svLS_LHS_CREATE.
      SUBROUTINE svLS_LHS_CREATE_C(pLHS, commu, gnNo, nNo, nnz, gNodes,
     2   rowPtr, colPtr, nFaces)

      INCLUDE "svLS_STD.h"

      TYPE(svLS_lhsType), POINTER, INTENT(OUT) :: pLHS
      TYPE(svLS_commuType), INTENT(IN) :: commu
      INTEGER, INTENT(IN) :: gnNo, nNo, nnz, nFaces
      INTEGER, INTENT(IN) :: gNodes(nNo)
      INTEGER, INTENT(IN) :: rowPtr(nNo+1)
      INTEGER, INTENT(IN) :: colPtr(nnz)

!     Persistent storage that pLHS is associated with
      TYPE(svLS_lhsType), SAVE, TARGET :: lhs

      CALL svLS_LHS_CREATE(lhs, commu, gnNo, nNo, nnz, gNodes, rowPtr,
     2   colPtr, nFaces)

      pLHS => lhs

      END SUBROUTINE svLS_LHS_CREATE_C
327