xref: /libCEED/backends/ref/ceed-ref-operator.c (revision 4b8bea3b15f6e9705ea378b18162a3dbd250c6ec)
// Copyright (c) 2017-2018, Lawrence Livermore National Security, LLC.
// Produced at the Lawrence Livermore National Laboratory. LLNL-CODE-734707.
// All Rights reserved. See files LICENSE and NOTICE for details.
//
// This file is part of CEED, a collection of benchmarks, miniapps, software
// libraries and APIs for efficient high-order finite element and spectral
// element discretizations for exascale applications. For more information and
// source code availability see http://github.com/ceed.
//
// The CEED research is supported by the Exascale Computing Project 17-SC-20-SC,
// a collaborative effort of two U.S. Department of Energy organizations (Office
// of Science and the National Nuclear Security Administration) responsible for
// the planning and preparation of a capable exascale ecosystem, including
// software, applications, hardware, advanced system engineering and early
// testbed platforms, in support of the nation's exascale computing imperative.
1621617c04Sjeremylt 
1721617c04Sjeremylt #include <ceed-impl.h>
1821617c04Sjeremylt #include <string.h>
1921617c04Sjeremylt #include "ceed-ref.h"
2021617c04Sjeremylt 
2121617c04Sjeremylt static int CeedOperatorDestroy_Ref(CeedOperator op) {
2221617c04Sjeremylt   CeedOperator_Ref *impl = op->data;
2321617c04Sjeremylt   int ierr;
2421617c04Sjeremylt 
25885ac19cSjeremylt   for (CeedInt i=0; i<impl->numein+impl->numeout; i++) {
26885ac19cSjeremylt     ierr = CeedVectorDestroy(&impl->evecs[i]); CeedChk(ierr);
27885ac19cSjeremylt   }
28885ac19cSjeremylt   ierr = CeedFree(&impl->evecs); CeedChk(ierr);
29885ac19cSjeremylt   ierr = CeedFree(&impl->edata); CeedChk(ierr);
30885ac19cSjeremylt 
31885ac19cSjeremylt   for (CeedInt i=0; i<impl->numqin+impl->numqout; i++) {
32885ac19cSjeremylt     ierr = CeedFree(&impl->qdata_alloc[i]); CeedChk(ierr);
33885ac19cSjeremylt   }
34885ac19cSjeremylt   ierr = CeedFree(&impl->qdata_alloc); CeedChk(ierr);
35885ac19cSjeremylt   ierr = CeedFree(&impl->qdata); CeedChk(ierr);
36885ac19cSjeremylt 
37885ac19cSjeremylt   ierr = CeedFree(&impl->indata); CeedChk(ierr);
38885ac19cSjeremylt   ierr = CeedFree(&impl->outdata); CeedChk(ierr);
39885ac19cSjeremylt 
4021617c04Sjeremylt   ierr = CeedFree(&op->data); CeedChk(ierr);
4121617c04Sjeremylt   return 0;
4221617c04Sjeremylt }
4321617c04Sjeremylt 
44885ac19cSjeremylt /*
45885ac19cSjeremylt   Setup infields or outfields
46885ac19cSjeremylt  */
47885ac19cSjeremylt static int CeedOperatorSetupFields_Ref(struct CeedQFunctionField qfields[16],
48885ac19cSjeremylt                                        struct CeedOperatorField ofields[16],
49885ac19cSjeremylt                                        CeedVector *evecs, CeedScalar **qdata,
50885ac19cSjeremylt                                        CeedScalar **qdata_alloc, CeedScalar **indata,
51135a076eSjeremylt                                        CeedInt starti, CeedInt startq,
52135a076eSjeremylt                                        CeedInt numfields, CeedInt Q) {
53135a076eSjeremylt   CeedInt dim, ierr, iq=startq, ncomp;
5421617c04Sjeremylt 
55885ac19cSjeremylt   // Loop over fields
56885ac19cSjeremylt   for (CeedInt i=0; i<numfields; i++) {
57885ac19cSjeremylt     CeedEvalMode emode = qfields[i].emode;
58135a076eSjeremylt 
59135a076eSjeremylt     if (emode != CEED_EVAL_WEIGHT) {
60*4b8bea3bSJed Brown       ierr = CeedElemRestrictionCreateVector(ofields[i].Erestrict, NULL,
61*4b8bea3bSJed Brown                                              &evecs[i+starti]);
62135a076eSjeremylt       CeedChk(ierr);
63135a076eSjeremylt     }
64135a076eSjeremylt 
65885ac19cSjeremylt     switch(emode) {
66885ac19cSjeremylt     case CEED_EVAL_NONE:
67885ac19cSjeremylt       break; // No action
68885ac19cSjeremylt     case CEED_EVAL_INTERP:
69885ac19cSjeremylt       ncomp = qfields[i].ncomp;
70885ac19cSjeremylt       ierr = CeedMalloc(Q*ncomp, &qdata_alloc[iq]); CeedChk(ierr);
71885ac19cSjeremylt       qdata[i + starti] = qdata_alloc[iq];
72885ac19cSjeremylt       iq++;
73885ac19cSjeremylt       break;
74885ac19cSjeremylt     case CEED_EVAL_GRAD:
75885ac19cSjeremylt       ncomp = qfields[i].ncomp;
76885ac19cSjeremylt       dim = ofields[i].basis->dim;
77885ac19cSjeremylt       ierr = CeedMalloc(Q*ncomp*dim, &qdata_alloc[iq]); CeedChk(ierr);
78885ac19cSjeremylt       qdata[i + starti] = qdata_alloc[iq];
79885ac19cSjeremylt       iq++;
80885ac19cSjeremylt       break;
81885ac19cSjeremylt     case CEED_EVAL_WEIGHT: // Only on input fields
82885ac19cSjeremylt       ierr = CeedMalloc(Q, &qdata_alloc[iq]); CeedChk(ierr);
83d3181881Sjeremylt       ierr = CeedBasisApply(ofields[iq].basis, 1, CEED_NOTRANSPOSE, CEED_EVAL_WEIGHT,
84885ac19cSjeremylt                             NULL, qdata_alloc[iq]); CeedChk(ierr);
85885ac19cSjeremylt       qdata[i] = qdata_alloc[iq];
86885ac19cSjeremylt       indata[i] = qdata[i];
87885ac19cSjeremylt       iq++;
88885ac19cSjeremylt       break;
89885ac19cSjeremylt     case CEED_EVAL_DIV:
90885ac19cSjeremylt       break; // Not implimented
91885ac19cSjeremylt     case CEED_EVAL_CURL:
92885ac19cSjeremylt       break; // Not implimented
9321617c04Sjeremylt     }
94885ac19cSjeremylt   }
9521617c04Sjeremylt   return 0;
9621617c04Sjeremylt }
9721617c04Sjeremylt 
98885ac19cSjeremylt /*
99885ac19cSjeremylt   CeedOperator needs to connect all the named fields (be they active or passive)
100885ac19cSjeremylt   to the named inputs and outputs of its CeedQFunction.
101885ac19cSjeremylt  */
102885ac19cSjeremylt static int CeedOperatorSetup_Ref(CeedOperator op) {
103885ac19cSjeremylt   if (op->setupdone) return 0;
104a2b73c81Sjeremylt   CeedOperator_Ref *impl = op->data;
105885ac19cSjeremylt   CeedQFunction qf = op->qf;
106885ac19cSjeremylt   CeedInt Q = op->numqpoints;
10721617c04Sjeremylt   int ierr;
10821617c04Sjeremylt 
109885ac19cSjeremylt   // Count infield and outfield array sizes and evectors
110a2b73c81Sjeremylt   impl->numein = qf->numinputfields;
111885ac19cSjeremylt   for (CeedInt i=0; i<qf->numinputfields; i++) {
112885ac19cSjeremylt     CeedEvalMode emode = qf->inputfields[i].emode;
1138d94b059Sjeremylt     impl->numqin += !!(emode & CEED_EVAL_INTERP) + !!(emode & CEED_EVAL_GRAD) +
1148d94b059Sjeremylt                     !!(emode & CEED_EVAL_WEIGHT);
11521617c04Sjeremylt   }
116a2b73c81Sjeremylt   impl->numeout = qf->numoutputfields;
117885ac19cSjeremylt   for (CeedInt i=0; i<qf->numoutputfields; i++) {
118885ac19cSjeremylt     CeedEvalMode emode = qf->outputfields[i].emode;
119a2b73c81Sjeremylt     impl->numqout += !!(emode & CEED_EVAL_INTERP) + !!(emode & CEED_EVAL_GRAD);
120885ac19cSjeremylt   }
121885ac19cSjeremylt 
122885ac19cSjeremylt   // Allocate
123a2b73c81Sjeremylt   ierr = CeedCalloc(impl->numein + impl->numeout, &impl->evecs); CeedChk(ierr);
124a2b73c81Sjeremylt   ierr = CeedCalloc(impl->numein + impl->numeout, &impl->edata);
125885ac19cSjeremylt   CeedChk(ierr);
126885ac19cSjeremylt 
127a2b73c81Sjeremylt   ierr = CeedCalloc(impl->numqin + impl->numqout, &impl->qdata_alloc);
128885ac19cSjeremylt   CeedChk(ierr);
129a2b73c81Sjeremylt   ierr = CeedCalloc(qf->numinputfields + qf->numoutputfields, &impl->qdata);
130885ac19cSjeremylt   CeedChk(ierr);
131885ac19cSjeremylt 
132a2b73c81Sjeremylt   ierr = CeedCalloc(16, &impl->indata); CeedChk(ierr);
133a2b73c81Sjeremylt   ierr = CeedCalloc(16, &impl->outdata); CeedChk(ierr);
134885ac19cSjeremylt 
135885ac19cSjeremylt   // Set up infield and outfield pointer arrays
136885ac19cSjeremylt   // Infields
137885ac19cSjeremylt   ierr = CeedOperatorSetupFields_Ref(qf->inputfields, op->inputfields,
138a2b73c81Sjeremylt                                      impl->evecs, impl->qdata, impl->qdata_alloc,
139a2b73c81Sjeremylt                                      impl->indata, 0, 0,
140885ac19cSjeremylt                                      qf->numinputfields, Q); CeedChk(ierr);
141885ac19cSjeremylt 
142885ac19cSjeremylt   // Outfields
143885ac19cSjeremylt   ierr = CeedOperatorSetupFields_Ref(qf->outputfields, op->outputfields,
144a2b73c81Sjeremylt                                      impl->evecs, impl->qdata, impl->qdata_alloc,
145a2b73c81Sjeremylt                                      impl->indata, qf->numinputfields,
146a2b73c81Sjeremylt                                      impl->numqin, qf->numoutputfields, Q); CeedChk(ierr);
147885ac19cSjeremylt 
1488d94b059Sjeremylt   // Input Qvecs
1498d94b059Sjeremylt   for (CeedInt i=0; i<qf->numinputfields; i++) {
1508d94b059Sjeremylt     CeedEvalMode emode = qf->inputfields[i].emode;
1518d94b059Sjeremylt     if ((emode != CEED_EVAL_NONE) && (emode != CEED_EVAL_WEIGHT))
1528d94b059Sjeremylt       impl->indata[i] =  impl->qdata[i];
1538d94b059Sjeremylt   }
1547ca8db16Sjeremylt   // Output Qvecs
1557ca8db16Sjeremylt   for (CeedInt i=0; i<qf->numoutputfields; i++) {
1567ca8db16Sjeremylt     CeedEvalMode emode = qf->outputfields[i].emode;
1578d94b059Sjeremylt     if (emode != CEED_EVAL_NONE)
158a2b73c81Sjeremylt       impl->outdata[i] =  impl->qdata[i + qf->numinputfields];
1597ca8db16Sjeremylt   }
1607ca8db16Sjeremylt 
161885ac19cSjeremylt   op->setupdone = 1;
162885ac19cSjeremylt 
163885ac19cSjeremylt   return 0;
164885ac19cSjeremylt }
165885ac19cSjeremylt 
166885ac19cSjeremylt static int CeedOperatorApply_Ref(CeedOperator op, CeedVector invec,
167885ac19cSjeremylt                                  CeedVector outvec, CeedRequest *request) {
168a2b73c81Sjeremylt   CeedOperator_Ref *impl = op->data;
169885ac19cSjeremylt   CeedInt Q = op->numqpoints, elemsize;
170885ac19cSjeremylt   int ierr;
171885ac19cSjeremylt   CeedQFunction qf = op->qf;
172885ac19cSjeremylt   CeedTransposeMode lmode = CEED_NOTRANSPOSE;
173885ac19cSjeremylt 
174885ac19cSjeremylt   // Setup
175885ac19cSjeremylt   ierr = CeedOperatorSetup_Ref(op); CeedChk(ierr);
176885ac19cSjeremylt 
177885ac19cSjeremylt   // Input Evecs and Restriction
178135a076eSjeremylt   for (CeedInt i=0; i<qf->numinputfields; i++) {
179668048e2SJed Brown     CeedEvalMode emode = qf->inputfields[i].emode;
180135a076eSjeremylt     if (emode == CEED_EVAL_WEIGHT) { // Skip
181668048e2SJed Brown     } else {
182668048e2SJed Brown       // Active
183668048e2SJed Brown       if (op->inputfields[i].vec == CEED_VECTOR_ACTIVE) {
184668048e2SJed Brown         // Restrict
185668048e2SJed Brown         ierr = CeedElemRestrictionApply(op->inputfields[i].Erestrict, CEED_NOTRANSPOSE,
186a2b73c81Sjeremylt                                         lmode, invec, impl->evecs[i],
187668048e2SJed Brown                                         request); CeedChk(ierr);
188668048e2SJed Brown         // Get evec
189a2b73c81Sjeremylt         ierr = CeedVectorGetArrayRead(impl->evecs[i], CEED_MEM_HOST,
190a2b73c81Sjeremylt                                       (const CeedScalar **) &impl->edata[i]); CeedChk(ierr);
191668048e2SJed Brown       } else {
192885ac19cSjeremylt         // Passive
1937ca8db16Sjeremylt         // Restrict
194885ac19cSjeremylt         ierr = CeedElemRestrictionApply(op->inputfields[i].Erestrict, CEED_NOTRANSPOSE,
195a2b73c81Sjeremylt                                         lmode, op->inputfields[i].vec, impl->evecs[i],
196885ac19cSjeremylt                                         request); CeedChk(ierr);
1977ca8db16Sjeremylt         // Get evec
198a2b73c81Sjeremylt         ierr = CeedVectorGetArrayRead(impl->evecs[i], CEED_MEM_HOST,
199a2b73c81Sjeremylt                                       (const CeedScalar **) &impl->edata[i]); CeedChk(ierr);
200885ac19cSjeremylt       }
201885ac19cSjeremylt     }
202885ac19cSjeremylt   }
203885ac19cSjeremylt 
204885ac19cSjeremylt   // Output Evecs
205135a076eSjeremylt   for (CeedInt i=0; i<qf->numoutputfields; i++) {
206a2b73c81Sjeremylt     ierr = CeedVectorGetArray(impl->evecs[i+impl->numein], CEED_MEM_HOST,
207a2b73c81Sjeremylt                               &impl->edata[i + qf->numinputfields]); CeedChk(ierr);
208885ac19cSjeremylt   }
209885ac19cSjeremylt 
210885ac19cSjeremylt   // Loop through elements
211885ac19cSjeremylt   for (CeedInt e=0; e<op->numelements; e++) {
212885ac19cSjeremylt     // Input basis apply if needed
213885ac19cSjeremylt     for (CeedInt i=0; i<qf->numinputfields; i++) {
214135a076eSjeremylt       // Get elemsize, emode, ncomp
215885ac19cSjeremylt       elemsize = op->inputfields[i].Erestrict->elemsize;
216885ac19cSjeremylt       CeedEvalMode emode = qf->inputfields[i].emode;
217885ac19cSjeremylt       CeedInt ncomp = qf->inputfields[i].ncomp;
218885ac19cSjeremylt       // Basis action
219885ac19cSjeremylt       switch(emode) {
220885ac19cSjeremylt       case CEED_EVAL_NONE:
221a2b73c81Sjeremylt         impl->indata[i] = &impl->edata[i][e*Q*ncomp];
222885ac19cSjeremylt         break;
223885ac19cSjeremylt       case CEED_EVAL_INTERP:
224d3181881Sjeremylt         ierr = CeedBasisApply(op->inputfields[i].basis, 1, CEED_NOTRANSPOSE,
225a2b73c81Sjeremylt                               CEED_EVAL_INTERP, &impl->edata[i][e*elemsize*ncomp], impl->qdata[i]);
226885ac19cSjeremylt         CeedChk(ierr);
227885ac19cSjeremylt         break;
228885ac19cSjeremylt       case CEED_EVAL_GRAD:
229d3181881Sjeremylt         ierr = CeedBasisApply(op->inputfields[i].basis, 1, CEED_NOTRANSPOSE,
230a2b73c81Sjeremylt                               CEED_EVAL_GRAD, &impl->edata[i][e*elemsize*ncomp], impl->qdata[i]);
231885ac19cSjeremylt         CeedChk(ierr);
232885ac19cSjeremylt         break;
233885ac19cSjeremylt       case CEED_EVAL_WEIGHT:
234885ac19cSjeremylt         break;  // No action
235885ac19cSjeremylt       case CEED_EVAL_DIV:
236885ac19cSjeremylt         break; // Not implimented
237885ac19cSjeremylt       case CEED_EVAL_CURL:
238885ac19cSjeremylt         break; // Not implimented
239885ac19cSjeremylt       }
240885ac19cSjeremylt     }
241885ac19cSjeremylt     // Output pointers
242885ac19cSjeremylt     for (CeedInt i=0; i<qf->numoutputfields; i++) {
243885ac19cSjeremylt       CeedEvalMode emode = qf->outputfields[i].emode;
244885ac19cSjeremylt       if (emode == CEED_EVAL_NONE) {
245885ac19cSjeremylt         CeedInt ncomp = qf->outputfields[i].ncomp;
246a2b73c81Sjeremylt         impl->outdata[i] = &impl->edata[i + qf->numinputfields][e*Q*ncomp];
247885ac19cSjeremylt       }
248885ac19cSjeremylt     }
249885ac19cSjeremylt     // Q function
250a2b73c81Sjeremylt     ierr = CeedQFunctionApply(op->qf, Q, (const CeedScalar * const*) impl->indata,
251a2b73c81Sjeremylt                               impl->outdata); CeedChk(ierr);
252885ac19cSjeremylt 
253885ac19cSjeremylt     // Output basis apply if needed
254885ac19cSjeremylt     for (CeedInt i=0; i<qf->numoutputfields; i++) {
255135a076eSjeremylt       // Get elemsize, emode, ncomp
256885ac19cSjeremylt       elemsize = op->outputfields[i].Erestrict->elemsize;
257885ac19cSjeremylt       CeedInt ncomp = qf->outputfields[i].ncomp;
258885ac19cSjeremylt       CeedEvalMode emode = qf->outputfields[i].emode;
259885ac19cSjeremylt       // Basis action
260885ac19cSjeremylt       switch(emode) {
261885ac19cSjeremylt       case CEED_EVAL_NONE:
262885ac19cSjeremylt         break; // No action
263885ac19cSjeremylt       case CEED_EVAL_INTERP:
264d3181881Sjeremylt         ierr = CeedBasisApply(op->outputfields[i].basis, 1, CEED_TRANSPOSE,
265a2b73c81Sjeremylt                               CEED_EVAL_INTERP, impl->outdata[i],
2668d94b059Sjeremylt                               &impl->edata[i + qf->numinputfields][e*elemsize*ncomp]);
2678d94b059Sjeremylt         CeedChk(ierr);
268885ac19cSjeremylt         break;
269885ac19cSjeremylt       case CEED_EVAL_GRAD:
2700c7a96bbSjeremylt         ierr = CeedBasisApply(op->outputfields[i].basis, 1, CEED_TRANSPOSE,
2710c7a96bbSjeremylt                               CEED_EVAL_GRAD,
272a2b73c81Sjeremylt                               impl->outdata[i], &impl->edata[i + qf->numinputfields][e*elemsize*ncomp]);
273885ac19cSjeremylt         CeedChk(ierr);
274885ac19cSjeremylt         break;
275885ac19cSjeremylt       case CEED_EVAL_WEIGHT:
2768d94b059Sjeremylt         return CeedError(op->ceed, 1,
2778d94b059Sjeremylt                          "CEED_EVAL_WEIGHT cannot be an output evaluation mode");
278885ac19cSjeremylt         break; // Should not occur
279885ac19cSjeremylt       case CEED_EVAL_DIV:
280885ac19cSjeremylt         break; // Not implimented
281885ac19cSjeremylt       case CEED_EVAL_CURL:
282885ac19cSjeremylt         break; // Not implimented
283885ac19cSjeremylt       }
284885ac19cSjeremylt     }
285885ac19cSjeremylt   }
286885ac19cSjeremylt 
287885ac19cSjeremylt   // Output restriction
288135a076eSjeremylt   for (CeedInt i=0; i<qf->numoutputfields; i++) {
289a2b73c81Sjeremylt     // Restore evec
290a2b73c81Sjeremylt     ierr = CeedVectorRestoreArray(impl->evecs[i+impl->numein],
291a2b73c81Sjeremylt                                   &impl->edata[i + qf->numinputfields]); CeedChk(ierr);
292668048e2SJed Brown     // Active
293668048e2SJed Brown     if (op->outputfields[i].vec == CEED_VECTOR_ACTIVE) {
2947ca8db16Sjeremylt       // Zero lvec
295a2b73c81Sjeremylt       ierr = CeedVectorSetValue(outvec, 0.0); CeedChk(ierr);
2967ca8db16Sjeremylt       // Restrict
297885ac19cSjeremylt       ierr = CeedElemRestrictionApply(op->outputfields[i].Erestrict, CEED_TRANSPOSE,
298a2b73c81Sjeremylt                                       lmode, impl->evecs[i+impl->numein], outvec, request); CeedChk(ierr);
299885ac19cSjeremylt     } else {
300885ac19cSjeremylt       // Passive
301668048e2SJed Brown       // Zero lvec
302a2b73c81Sjeremylt       ierr = CeedVectorSetValue(op->outputfields[i].vec, 0.0); CeedChk(ierr);
303668048e2SJed Brown       // Restrict
304668048e2SJed Brown       ierr = CeedElemRestrictionApply(op->outputfields[i].Erestrict, CEED_TRANSPOSE,
305a2b73c81Sjeremylt                                       lmode, impl->evecs[i+impl->numein], op->outputfields[i].vec,
306668048e2SJed Brown                                       request); CeedChk(ierr);
307885ac19cSjeremylt     }
308885ac19cSjeremylt   }
309885ac19cSjeremylt 
3107ca8db16Sjeremylt   // Restore input arrays
311135a076eSjeremylt   for (CeedInt i=0; i<qf->numinputfields; i++) {
3127ca8db16Sjeremylt     CeedEvalMode emode = qf->inputfields[i].emode;
313135a076eSjeremylt     if (emode == CEED_EVAL_WEIGHT) { // Skip
3147ca8db16Sjeremylt     } else {
315a2b73c81Sjeremylt       ierr = CeedVectorRestoreArrayRead(impl->evecs[i],
316a2b73c81Sjeremylt                                         (const CeedScalar **) &impl->edata[i]); CeedChk(ierr);
3177ca8db16Sjeremylt     }
3187ca8db16Sjeremylt   }
3197ca8db16Sjeremylt 
32021617c04Sjeremylt   return 0;
32121617c04Sjeremylt }
32221617c04Sjeremylt 
32321617c04Sjeremylt int CeedOperatorCreate_Ref(CeedOperator op) {
32421617c04Sjeremylt   CeedOperator_Ref *impl;
32521617c04Sjeremylt   int ierr;
32621617c04Sjeremylt 
32721617c04Sjeremylt   ierr = CeedCalloc(1, &impl); CeedChk(ierr);
32821617c04Sjeremylt   op->data = impl;
32921617c04Sjeremylt   op->Destroy = CeedOperatorDestroy_Ref;
33021617c04Sjeremylt   op->Apply = CeedOperatorApply_Ref;
33121617c04Sjeremylt   return 0;
33221617c04Sjeremylt }
333