xref: /libCEED/backends/ref/ceed-ref-operator.c (revision 8d94b0593ef54c33797e8bc6482f658a5be1664c)
// Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
// Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
// All Rights reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
1621617c04Sjeremylt 
1721617c04Sjeremylt #include <ceed-impl.h>
1821617c04Sjeremylt #include <string.h>
1921617c04Sjeremylt #include "ceed-ref.h"
2021617c04Sjeremylt 
2121617c04Sjeremylt static int CeedOperatorDestroy_Ref(CeedOperator op) {
2221617c04Sjeremylt   CeedOperator_Ref *impl = op->data;
2321617c04Sjeremylt   int ierr;
2421617c04Sjeremylt 
25885ac19cSjeremylt   for (CeedInt i=0; i<impl->numein+impl->numeout; i++) {
26885ac19cSjeremylt     ierr = CeedVectorDestroy(&impl->evecs[i]); CeedChk(ierr);
27885ac19cSjeremylt   }
28885ac19cSjeremylt   ierr = CeedFree(&impl->evecs); CeedChk(ierr);
29885ac19cSjeremylt   ierr = CeedFree(&impl->edata); CeedChk(ierr);
30885ac19cSjeremylt 
31885ac19cSjeremylt   for (CeedInt i=0; i<impl->numqin+impl->numqout; i++) {
32885ac19cSjeremylt     ierr = CeedFree(&impl->qdata_alloc[i]); CeedChk(ierr);
33885ac19cSjeremylt   }
34885ac19cSjeremylt   ierr = CeedFree(&impl->qdata_alloc); CeedChk(ierr);
35885ac19cSjeremylt   ierr = CeedFree(&impl->qdata); CeedChk(ierr);
36885ac19cSjeremylt 
37885ac19cSjeremylt   ierr = CeedFree(&impl->indata); CeedChk(ierr);
38885ac19cSjeremylt   ierr = CeedFree(&impl->outdata); CeedChk(ierr);
39885ac19cSjeremylt 
4021617c04Sjeremylt   ierr = CeedFree(&op->data); CeedChk(ierr);
4121617c04Sjeremylt   return 0;
4221617c04Sjeremylt }
4321617c04Sjeremylt 
44885ac19cSjeremylt /*
45885ac19cSjeremylt   Setup infields or outfields
46885ac19cSjeremylt  */
47885ac19cSjeremylt static int CeedOperatorSetupFields_Ref(struct CeedQFunctionField qfields[16],
48885ac19cSjeremylt                                        struct CeedOperatorField ofields[16],
49885ac19cSjeremylt                                        CeedVector *evecs, CeedScalar **qdata,
50885ac19cSjeremylt                                        CeedScalar **qdata_alloc, CeedScalar **indata,
51135a076eSjeremylt                                        CeedInt starti, CeedInt startq,
52135a076eSjeremylt                                        CeedInt numfields, CeedInt Q) {
53135a076eSjeremylt   CeedInt dim, ierr, iq=startq, ncomp;
5421617c04Sjeremylt 
55885ac19cSjeremylt   // Loop over fields
56885ac19cSjeremylt   for (CeedInt i=0; i<numfields; i++) {
57885ac19cSjeremylt     CeedEvalMode emode = qfields[i].emode;
58135a076eSjeremylt 
59135a076eSjeremylt     if (emode != CEED_EVAL_WEIGHT) {
60135a076eSjeremylt       ierr = CeedElemRestrictionCreateVector(ofields[i].Erestrict, NULL, &evecs[i+starti]);
61135a076eSjeremylt       CeedChk(ierr);
62135a076eSjeremylt     }
63135a076eSjeremylt 
64885ac19cSjeremylt     switch(emode) {
65885ac19cSjeremylt     case CEED_EVAL_NONE:
66885ac19cSjeremylt       break; // No action
67885ac19cSjeremylt     case CEED_EVAL_INTERP:
68885ac19cSjeremylt       ncomp = qfields[i].ncomp;
69885ac19cSjeremylt       ierr = CeedMalloc(Q*ncomp, &qdata_alloc[iq]); CeedChk(ierr);
70885ac19cSjeremylt       qdata[i + starti] = qdata_alloc[iq];
71885ac19cSjeremylt       iq++;
72885ac19cSjeremylt       break;
73885ac19cSjeremylt     case CEED_EVAL_GRAD:
74885ac19cSjeremylt       ncomp = qfields[i].ncomp;
75885ac19cSjeremylt       dim = ofields[i].basis->dim;
76885ac19cSjeremylt       ierr = CeedMalloc(Q*ncomp*dim, &qdata_alloc[iq]); CeedChk(ierr);
77885ac19cSjeremylt       qdata[i + starti] = qdata_alloc[iq];
78885ac19cSjeremylt       iq++;
79885ac19cSjeremylt       break;
80885ac19cSjeremylt     case CEED_EVAL_WEIGHT: // Only on input fields
81885ac19cSjeremylt       ierr = CeedMalloc(Q, &qdata_alloc[iq]); CeedChk(ierr);
82d3181881Sjeremylt       ierr = CeedBasisApply(ofields[iq].basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT,
83885ac19cSjeremylt                             NULL, qdata_alloc[iq]); CeedChk(ierr);
84885ac19cSjeremylt       qdata[i] = qdata_alloc[iq];
85885ac19cSjeremylt       indata[i] = qdata[i];
86885ac19cSjeremylt       iq++;
87885ac19cSjeremylt       break;
88885ac19cSjeremylt     case CEED_EVAL_DIV:
89885ac19cSjeremylt       break; // Not implimented
90885ac19cSjeremylt     case CEED_EVAL_CURL:
91885ac19cSjeremylt       break; // Not implimented
9221617c04Sjeremylt     }
93885ac19cSjeremylt   }
9421617c04Sjeremylt   return 0;
9521617c04Sjeremylt }
9621617c04Sjeremylt 
97885ac19cSjeremylt /*
98885ac19cSjeremylt   CeedOperator needs to connect all the named fields (be they active or passive)
99885ac19cSjeremylt   to the named inputs and outputs of its CeedQFunction.
100885ac19cSjeremylt  */
101885ac19cSjeremylt static int CeedOperatorSetup_Ref(CeedOperator op) {
102885ac19cSjeremylt   if (op->setupdone) return 0;
103a2b73c81Sjeremylt   CeedOperator_Ref *impl = op->data;
104885ac19cSjeremylt   CeedQFunction qf = op->qf;
105885ac19cSjeremylt   CeedInt Q = op->numqpoints;
10621617c04Sjeremylt   int ierr;
10721617c04Sjeremylt 
108885ac19cSjeremylt   // Count infield and outfield array sizes and evectors
109a2b73c81Sjeremylt   impl->numein = qf->numinputfields;
110885ac19cSjeremylt   for (CeedInt i=0; i<qf->numinputfields; i++) {
111885ac19cSjeremylt     CeedEvalMode emode = qf->inputfields[i].emode;
112*8d94b059Sjeremylt     impl->numqin += !!(emode & CEED_EVAL_INTERP) + !!(emode & CEED_EVAL_GRAD) +
113*8d94b059Sjeremylt                     !!(emode & CEED_EVAL_WEIGHT);
11421617c04Sjeremylt   }
115a2b73c81Sjeremylt   impl->numeout = qf->numoutputfields;
116885ac19cSjeremylt   for (CeedInt i=0; i<qf->numoutputfields; i++) {
117885ac19cSjeremylt     CeedEvalMode emode = qf->outputfields[i].emode;
118a2b73c81Sjeremylt     impl->numqout += !!(emode & CEED_EVAL_INTERP) + !!(emode & CEED_EVAL_GRAD);
119885ac19cSjeremylt   }
120885ac19cSjeremylt 
121885ac19cSjeremylt   // Allocate
122a2b73c81Sjeremylt   ierr = CeedCalloc(impl->numein + impl->numeout, &impl->evecs); CeedChk(ierr);
123a2b73c81Sjeremylt   ierr = CeedCalloc(impl->numein + impl->numeout, &impl->edata);
124885ac19cSjeremylt   CeedChk(ierr);
125885ac19cSjeremylt 
126a2b73c81Sjeremylt   ierr = CeedCalloc(impl->numqin + impl->numqout, &impl->qdata_alloc);
127885ac19cSjeremylt   CeedChk(ierr);
128a2b73c81Sjeremylt   ierr = CeedCalloc(qf->numinputfields + qf->numoutputfields, &impl->qdata);
129885ac19cSjeremylt   CeedChk(ierr);
130885ac19cSjeremylt 
131a2b73c81Sjeremylt   ierr = CeedCalloc(16, &impl->indata); CeedChk(ierr);
132a2b73c81Sjeremylt   ierr = CeedCalloc(16, &impl->outdata); CeedChk(ierr);
133885ac19cSjeremylt 
134885ac19cSjeremylt   // Set up infield and outfield pointer arrays
135885ac19cSjeremylt   // Infields
136885ac19cSjeremylt   ierr = CeedOperatorSetupFields_Ref(qf->inputfields, op->inputfields,
137a2b73c81Sjeremylt                                      impl->evecs, impl->qdata, impl->qdata_alloc,
138a2b73c81Sjeremylt                                      impl->indata, 0, 0,
139885ac19cSjeremylt                                      qf->numinputfields, Q); CeedChk(ierr);
140885ac19cSjeremylt 
141885ac19cSjeremylt   // Outfields
142885ac19cSjeremylt   ierr = CeedOperatorSetupFields_Ref(qf->outputfields, op->outputfields,
143a2b73c81Sjeremylt                                      impl->evecs, impl->qdata, impl->qdata_alloc,
144a2b73c81Sjeremylt                                      impl->indata, qf->numinputfields,
145a2b73c81Sjeremylt                                      impl->numqin, qf->numoutputfields, Q); CeedChk(ierr);
146885ac19cSjeremylt 
147*8d94b059Sjeremylt   // Input Qvecs
148*8d94b059Sjeremylt   for (CeedInt i=0; i<qf->numinputfields; i++) {
149*8d94b059Sjeremylt     CeedEvalMode emode = qf->inputfields[i].emode;
150*8d94b059Sjeremylt     if ((emode != CEED_EVAL_NONE) && (emode != CEED_EVAL_WEIGHT))
151*8d94b059Sjeremylt       impl->indata[i] =  impl->qdata[i];
152*8d94b059Sjeremylt   }
1537ca8db16Sjeremylt   // Output Qvecs
1547ca8db16Sjeremylt   for (CeedInt i=0; i<qf->numoutputfields; i++) {
1557ca8db16Sjeremylt     CeedEvalMode emode = qf->outputfields[i].emode;
156*8d94b059Sjeremylt     if (emode != CEED_EVAL_NONE)
157a2b73c81Sjeremylt       impl->outdata[i] =  impl->qdata[i + qf->numinputfields];
1587ca8db16Sjeremylt   }
1597ca8db16Sjeremylt 
160885ac19cSjeremylt   op->setupdone = 1;
161885ac19cSjeremylt 
162885ac19cSjeremylt   return 0;
163885ac19cSjeremylt }
164885ac19cSjeremylt 
165885ac19cSjeremylt static int CeedOperatorApply_Ref(CeedOperator op, CeedVector invec,
166885ac19cSjeremylt                                  CeedVector outvec, CeedRequest *request) {
167a2b73c81Sjeremylt   CeedOperator_Ref *impl = op->data;
168885ac19cSjeremylt   CeedInt Q = op->numqpoints, elemsize;
169885ac19cSjeremylt   int ierr;
170885ac19cSjeremylt   CeedQFunction qf = op->qf;
171885ac19cSjeremylt   CeedTransposeMode lmode = CEED_NOTRANSPOSE;
172885ac19cSjeremylt 
173885ac19cSjeremylt   // Setup
174885ac19cSjeremylt   ierr = CeedOperatorSetup_Ref(op); CeedChk(ierr);
175885ac19cSjeremylt 
176885ac19cSjeremylt   // Input Evecs and Restriction
177135a076eSjeremylt   for (CeedInt i=0; i<qf->numinputfields; i++) {
178668048e2SJed Brown     CeedEvalMode emode = qf->inputfields[i].emode;
179135a076eSjeremylt     if (emode == CEED_EVAL_WEIGHT) { // Skip
180668048e2SJed Brown     } else {
181668048e2SJed Brown       // Active
182668048e2SJed Brown       if (op->inputfields[i].vec == CEED_VECTOR_ACTIVE) {
183668048e2SJed Brown         // Restrict
184668048e2SJed Brown         ierr = CeedElemRestrictionApply(op->inputfields[i].Erestrict, CEED_NOTRANSPOSE,
185a2b73c81Sjeremylt                                         lmode, invec, impl->evecs[i],
186668048e2SJed Brown                                         request); CeedChk(ierr);
187668048e2SJed Brown         // Get evec
188a2b73c81Sjeremylt         ierr = CeedVectorGetArrayRead(impl->evecs[i], CEED_MEM_HOST,
189a2b73c81Sjeremylt                                       (const CeedScalar **) &impl->edata[i]); CeedChk(ierr);
190668048e2SJed Brown       } else {
191885ac19cSjeremylt         // Passive
1927ca8db16Sjeremylt         // Restrict
193885ac19cSjeremylt         ierr = CeedElemRestrictionApply(op->inputfields[i].Erestrict, CEED_NOTRANSPOSE,
194a2b73c81Sjeremylt                                         lmode, op->inputfields[i].vec, impl->evecs[i],
195885ac19cSjeremylt                                         request); CeedChk(ierr);
1967ca8db16Sjeremylt         // Get evec
197a2b73c81Sjeremylt         ierr = CeedVectorGetArrayRead(impl->evecs[i], CEED_MEM_HOST,
198a2b73c81Sjeremylt                                       (const CeedScalar **) &impl->edata[i]); CeedChk(ierr);
199885ac19cSjeremylt       }
200885ac19cSjeremylt     }
201885ac19cSjeremylt   }
202885ac19cSjeremylt 
203885ac19cSjeremylt   // Output Evecs
204135a076eSjeremylt   for (CeedInt i=0; i<qf->numoutputfields; i++) {
205a2b73c81Sjeremylt     ierr = CeedVectorGetArray(impl->evecs[i+impl->numein], CEED_MEM_HOST,
206a2b73c81Sjeremylt                               &impl->edata[i + qf->numinputfields]); CeedChk(ierr);
207885ac19cSjeremylt   }
208885ac19cSjeremylt 
209885ac19cSjeremylt   // Loop through elements
210885ac19cSjeremylt   for (CeedInt e=0; e<op->numelements; e++) {
211885ac19cSjeremylt     // Input basis apply if needed
212885ac19cSjeremylt     for (CeedInt i=0; i<qf->numinputfields; i++) {
213135a076eSjeremylt       // Get elemsize, emode, ncomp
214885ac19cSjeremylt       elemsize = op->inputfields[i].Erestrict->elemsize;
215885ac19cSjeremylt       CeedEvalMode emode = qf->inputfields[i].emode;
216885ac19cSjeremylt       CeedInt ncomp = qf->inputfields[i].ncomp;
217885ac19cSjeremylt       // Basis action
218885ac19cSjeremylt       switch(emode) {
219885ac19cSjeremylt       case CEED_EVAL_NONE:
220a2b73c81Sjeremylt         impl->indata[i] = &impl->edata[i][e*Q*ncomp];
221885ac19cSjeremylt         break;
222885ac19cSjeremylt       case CEED_EVAL_INTERP:
223d3181881Sjeremylt         ierr = CeedBasisApply(op->inputfields[i].basis, 1, CEED_NOTRANSPOSE,
224a2b73c81Sjeremylt                               CEED_EVAL_INTERP, &impl->edata[i][e*elemsize*ncomp], impl->qdata[i]);
225885ac19cSjeremylt         CeedChk(ierr);
226885ac19cSjeremylt         break;
227885ac19cSjeremylt       case CEED_EVAL_GRAD:
228d3181881Sjeremylt         ierr = CeedBasisApply(op->inputfields[i].basis, 1, CEED_NOTRANSPOSE,
229a2b73c81Sjeremylt                               CEED_EVAL_GRAD, &impl->edata[i][e*elemsize*ncomp], impl->qdata[i]);
230885ac19cSjeremylt         CeedChk(ierr);
231885ac19cSjeremylt         break;
232885ac19cSjeremylt       case CEED_EVAL_WEIGHT:
233885ac19cSjeremylt         break;  // No action
234885ac19cSjeremylt       case CEED_EVAL_DIV:
235885ac19cSjeremylt         break; // Not implimented
236885ac19cSjeremylt       case CEED_EVAL_CURL:
237885ac19cSjeremylt         break; // Not implimented
238885ac19cSjeremylt       }
239885ac19cSjeremylt     }
240885ac19cSjeremylt     // Output pointers
241885ac19cSjeremylt     for (CeedInt i=0; i<qf->numoutputfields; i++) {
242885ac19cSjeremylt       CeedEvalMode emode = qf->outputfields[i].emode;
243885ac19cSjeremylt       if (emode == CEED_EVAL_NONE) {
244885ac19cSjeremylt         CeedInt ncomp = qf->outputfields[i].ncomp;
245a2b73c81Sjeremylt         impl->outdata[i] = &impl->edata[i + qf->numinputfields][e*Q*ncomp];
246885ac19cSjeremylt       }
247885ac19cSjeremylt     }
248885ac19cSjeremylt     // Q function
249a2b73c81Sjeremylt     ierr = CeedQFunctionApply(op->qf, Q, (const CeedScalar * const*) impl->indata,
250a2b73c81Sjeremylt                               impl->outdata); CeedChk(ierr);
251885ac19cSjeremylt 
252885ac19cSjeremylt     // Output basis apply if needed
253885ac19cSjeremylt     for (CeedInt i=0; i<qf->numoutputfields; i++) {
254135a076eSjeremylt       // Get elemsize, emode, ncomp
255885ac19cSjeremylt       elemsize = op->outputfields[i].Erestrict->elemsize;
256885ac19cSjeremylt       CeedInt ncomp = qf->outputfields[i].ncomp;
257885ac19cSjeremylt       CeedEvalMode emode = qf->outputfields[i].emode;
258885ac19cSjeremylt       // Basis action
259885ac19cSjeremylt       switch(emode) {
260885ac19cSjeremylt       case CEED_EVAL_NONE:
261885ac19cSjeremylt         break; // No action
262885ac19cSjeremylt       case CEED_EVAL_INTERP:
263d3181881Sjeremylt         ierr = CeedBasisApply(op->outputfields[i].basis, 1, CEED_TRANSPOSE,
264a2b73c81Sjeremylt                               CEED_EVAL_INTERP, impl->outdata[i],
265*8d94b059Sjeremylt                               &impl->edata[i + qf->numinputfields][e*elemsize*ncomp]);
266*8d94b059Sjeremylt         CeedChk(ierr);
267885ac19cSjeremylt         break;
268885ac19cSjeremylt       case CEED_EVAL_GRAD:
2690c7a96bbSjeremylt         ierr = CeedBasisApply(op->outputfields[i].basis, 1, CEED_TRANSPOSE,
2700c7a96bbSjeremylt                               CEED_EVAL_GRAD,
271a2b73c81Sjeremylt                               impl->outdata[i], &impl->edata[i + qf->numinputfields][e*elemsize*ncomp]);
272885ac19cSjeremylt         CeedChk(ierr);
273885ac19cSjeremylt         break;
274885ac19cSjeremylt       case CEED_EVAL_WEIGHT:
275*8d94b059Sjeremylt         return CeedError(op->ceed, 1,
276*8d94b059Sjeremylt                          "CEED_EVAL_WEIGHT cannot be an output evaluation mode");
277885ac19cSjeremylt         break; // Should not occur
278885ac19cSjeremylt       case CEED_EVAL_DIV:
279885ac19cSjeremylt         break; // Not implimented
280885ac19cSjeremylt       case CEED_EVAL_CURL:
281885ac19cSjeremylt         break; // Not implimented
282885ac19cSjeremylt       }
283885ac19cSjeremylt     }
284885ac19cSjeremylt   }
285885ac19cSjeremylt 
286885ac19cSjeremylt   // Output restriction
287135a076eSjeremylt   for (CeedInt i=0; i<qf->numoutputfields; i++) {
288a2b73c81Sjeremylt     // Restore evec
289a2b73c81Sjeremylt     ierr = CeedVectorRestoreArray(impl->evecs[i+impl->numein],
290a2b73c81Sjeremylt                                     &impl->edata[i + qf->numinputfields]); CeedChk(ierr);
291668048e2SJed Brown     // Active
292668048e2SJed Brown     if (op->outputfields[i].vec == CEED_VECTOR_ACTIVE) {
2937ca8db16Sjeremylt       // Zero lvec
294a2b73c81Sjeremylt       ierr = CeedVectorSetValue(outvec, 0.0); CeedChk(ierr);
2957ca8db16Sjeremylt       // Restrict
296885ac19cSjeremylt       ierr = CeedElemRestrictionApply(op->outputfields[i].Erestrict, CEED_TRANSPOSE,
297a2b73c81Sjeremylt                                       lmode, impl->evecs[i+impl->numein], outvec, request); CeedChk(ierr);
298885ac19cSjeremylt     } else {
299885ac19cSjeremylt       // Passive
300668048e2SJed Brown       // Zero lvec
301a2b73c81Sjeremylt       ierr = CeedVectorSetValue(op->outputfields[i].vec, 0.0); CeedChk(ierr);
302668048e2SJed Brown       // Restrict
303668048e2SJed Brown       ierr = CeedElemRestrictionApply(op->outputfields[i].Erestrict, CEED_TRANSPOSE,
304a2b73c81Sjeremylt                                       lmode, impl->evecs[i+impl->numein], op->outputfields[i].vec,
305668048e2SJed Brown                                       request); CeedChk(ierr);
306885ac19cSjeremylt     }
307885ac19cSjeremylt   }
308885ac19cSjeremylt 
3097ca8db16Sjeremylt   // Restore input arrays
310135a076eSjeremylt   for (CeedInt i=0; i<qf->numinputfields; i++) {
3117ca8db16Sjeremylt     CeedEvalMode emode = qf->inputfields[i].emode;
312135a076eSjeremylt     if (emode == CEED_EVAL_WEIGHT) { // Skip
3137ca8db16Sjeremylt     } else {
314a2b73c81Sjeremylt       ierr = CeedVectorRestoreArrayRead(impl->evecs[i],
315a2b73c81Sjeremylt                                         (const CeedScalar **) &impl->edata[i]); CeedChk(ierr);
3167ca8db16Sjeremylt     }
3177ca8db16Sjeremylt   }
3187ca8db16Sjeremylt 
31921617c04Sjeremylt   return 0;
32021617c04Sjeremylt }
32121617c04Sjeremylt 
32221617c04Sjeremylt int CeedOperatorCreate_Ref(CeedOperator op) {
32321617c04Sjeremylt   CeedOperator_Ref *impl;
32421617c04Sjeremylt   int ierr;
32521617c04Sjeremylt 
32621617c04Sjeremylt   ierr = CeedCalloc(1, &impl); CeedChk(ierr);
32721617c04Sjeremylt   op->data = impl;
32821617c04Sjeremylt   op->Destroy = CeedOperatorDestroy_Ref;
32921617c04Sjeremylt   op->Apply = CeedOperatorApply_Ref;
33021617c04Sjeremylt   return 0;
33121617c04Sjeremylt }
332