xref: /petsc/src/ksp/pc/impls/bddc/bddcgraph.c (revision 2bf68e3e0f2a61f71e7c65bee250bfa1c8ce0cdb)
1 #include <petsc/private/petscimpl.h>
2 #include <../src/ksp/pc/impls/bddc/bddcprivate.h>
3 #include <../src/ksp/pc/impls/bddc/bddcstructs.h>
4 
5 #undef __FUNCT__
6 #define __FUNCT__ "PCBDDCGraphGetDirichletDofsB"
7 PetscErrorCode PCBDDCGraphGetDirichletDofsB(PCBDDCGraph graph, IS* dirdofs)
8 {
9   PetscErrorCode ierr;
10 
11   PetscFunctionBegin;
12   if (graph->dirdofsB) {
13     ierr = PetscObjectReference((PetscObject)graph->dirdofsB);CHKERRQ(ierr);
14   } else if (graph->has_dirichlet) {
15     PetscInt i,size;
16     PetscInt *dirdofs_idxs;
17 
18     size = 0;
19     for (i=0;i<graph->nvtxs;i++) {
20       if (graph->count[i] && graph->special_dof[i] == PCBDDCGRAPH_DIRICHLET_MARK) size++;
21     }
22 
23     ierr = PetscMalloc1(size,&dirdofs_idxs);CHKERRQ(ierr);
24     size = 0;
25     for (i=0;i<graph->nvtxs;i++) {
26       if (graph->count[i] && graph->special_dof[i] == PCBDDCGRAPH_DIRICHLET_MARK) dirdofs_idxs[size++] = i;
27     }
28     ierr = ISCreateGeneral(PETSC_COMM_SELF,size,dirdofs_idxs,PETSC_OWN_POINTER,&graph->dirdofsB);CHKERRQ(ierr);
29     ierr = PetscObjectReference((PetscObject)graph->dirdofsB);CHKERRQ(ierr);
30   }
31   *dirdofs = graph->dirdofsB;
32   PetscFunctionReturn(0);
33 }
34 
35 #undef __FUNCT__
36 #define __FUNCT__ "PCBDDCGraphGetDirichletDofs"
37 PetscErrorCode PCBDDCGraphGetDirichletDofs(PCBDDCGraph graph, IS* dirdofs)
38 {
39   PetscErrorCode ierr;
40 
41   PetscFunctionBegin;
42   if (graph->dirdofs) {
43     ierr = PetscObjectReference((PetscObject)graph->dirdofs);CHKERRQ(ierr);
44   } else if (graph->has_dirichlet) {
45     PetscInt i,size;
46     PetscInt *dirdofs_idxs;
47 
48     size = 0;
49     for (i=0;i<graph->nvtxs;i++) {
50       if (graph->special_dof[i] == PCBDDCGRAPH_DIRICHLET_MARK) size++;
51     }
52 
53     ierr = PetscMalloc1(size,&dirdofs_idxs);CHKERRQ(ierr);
54     size = 0;
55     for (i=0;i<graph->nvtxs;i++) {
56       if (graph->special_dof[i] == PCBDDCGRAPH_DIRICHLET_MARK) dirdofs_idxs[size++] = i;
57     }
58     ierr = ISCreateGeneral(PetscObjectComm((PetscObject)graph->l2gmap),size,dirdofs_idxs,PETSC_OWN_POINTER,&graph->dirdofs);CHKERRQ(ierr);
59     ierr = PetscObjectReference((PetscObject)graph->dirdofs);CHKERRQ(ierr);
60   }
61   *dirdofs = graph->dirdofs;
62   PetscFunctionReturn(0);
63 }
64 
65 #undef __FUNCT__
66 #define __FUNCT__ "PCBDDCGraphASCIIView"
67 PetscErrorCode PCBDDCGraphASCIIView(PCBDDCGraph graph, PetscInt verbosity_level, PetscViewer viewer)
68 {
69   PetscInt       i,j,tabs;
70   PetscInt*      queue_in_global_numbering;
71   PetscErrorCode ierr;
72 
73   PetscFunctionBegin;
74   ierr = PetscViewerASCIIPushSynchronized(viewer);CHKERRQ(ierr);
75   ierr = PetscViewerASCIIGetTab(viewer,&tabs);CHKERRQ(ierr);
76   ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
77   ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
78   ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Local BDDC graph for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
79   ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Number of vertices %d\n",graph->nvtxs);CHKERRQ(ierr);
80   ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Custom minimal size %d\n",graph->custom_minimal_size);CHKERRQ(ierr);
81   ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Max count %d\n",graph->maxcount);CHKERRQ(ierr);
82   ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Topological two dim? %d (set %d)\n",graph->twodim,graph->twodimset);CHKERRQ(ierr);
83   if (verbosity_level > 2) {
84     for (i=0;i<graph->nvtxs;i++) {
85       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d:\n",i);CHKERRQ(ierr);
86       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"   which_dof: %d\n",graph->which_dof[i]);CHKERRQ(ierr);
87       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"   special_dof: %d\n",graph->special_dof[i]);CHKERRQ(ierr);
88       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"   neighbours: %d\n",graph->count[i]);CHKERRQ(ierr);
89       ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
90       if (graph->count[i]) {
91         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"     set of neighbours:");CHKERRQ(ierr);
92         for (j=0;j<graph->count[i];j++) {
93           ierr = PetscViewerASCIISynchronizedPrintf(viewer," %d",graph->neighbours_set[i][j]);CHKERRQ(ierr);
94         }
95         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");CHKERRQ(ierr);
96       }
97       ierr = PetscViewerASCIISetTab(viewer,tabs);CHKERRQ(ierr);
98       ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr);
99       if (graph->mirrors) {
100         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"   mirrors: %d\n",graph->mirrors[i]);CHKERRQ(ierr);
101         if (graph->mirrors[i]) {
102           ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
103           ierr = PetscViewerASCIISynchronizedPrintf(viewer,"     set of mirrors:");CHKERRQ(ierr);
104           for (j=0;j<graph->mirrors[i];j++) {
105             ierr = PetscViewerASCIISynchronizedPrintf(viewer," %d",graph->mirrors_set[i][j]);CHKERRQ(ierr);
106           }
107           ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");CHKERRQ(ierr);
108           ierr = PetscViewerASCIISetTab(viewer,tabs);CHKERRQ(ierr);
109           ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr);
110         }
111       }
112       if (verbosity_level > 3) {
113         if (graph->xadj) {
114           ierr = PetscViewerASCIISynchronizedPrintf(viewer,"   local adj list:");CHKERRQ(ierr);
115           ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
116           for (j=graph->xadj[i];j<graph->xadj[i+1];j++) {
117             ierr = PetscViewerASCIISynchronizedPrintf(viewer," %d",graph->adjncy[j]);CHKERRQ(ierr);
118           }
119           ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");CHKERRQ(ierr);
120           ierr = PetscViewerASCIISetTab(viewer,tabs);CHKERRQ(ierr);
121           ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr);
122         } else {
123           ierr = PetscViewerASCIISynchronizedPrintf(viewer,"   no adj info\n");CHKERRQ(ierr);
124         }
125       }
126       if (graph->n_local_subs) {
127         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"   local sub id: %d\n",graph->local_subs[i]);CHKERRQ(ierr);
128       }
129       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"   interface subset id: %d\n",graph->subset[i]);CHKERRQ(ierr);
130       if (graph->subset[i] && graph->subset_ncc) {
131         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"   ncc for subset: %d\n",graph->subset_ncc[graph->subset[i]-1]);CHKERRQ(ierr);
132       }
133     }
134   }
135   ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Total number of connected components %d\n",graph->ncc);CHKERRQ(ierr);
136   ierr = PetscMalloc1(graph->cptr[graph->ncc],&queue_in_global_numbering);CHKERRQ(ierr);
137   ierr = ISLocalToGlobalMappingApply(graph->l2gmap,graph->cptr[graph->ncc],graph->queue,queue_in_global_numbering);CHKERRQ(ierr);
138   for (i=0;i<graph->ncc;i++) {
139     PetscInt node_num=graph->queue[graph->cptr[i]];
140     PetscBool printcc = PETSC_FALSE;
141     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"  cc %d (size %d, fid %d, neighs:",i,graph->cptr[i+1]-graph->cptr[i],graph->which_dof[node_num]);CHKERRQ(ierr);
142     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_FALSE);CHKERRQ(ierr);
143     for (j=0;j<graph->count[node_num];j++) {
144       ierr = PetscViewerASCIISynchronizedPrintf(viewer," %d",graph->neighbours_set[node_num][j]);CHKERRQ(ierr);
145     }
146     if (verbosity_level > 1) {
147       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"):");CHKERRQ(ierr);
148       if (graph->twodim || graph->count[node_num] > 1 || (graph->count[node_num] == 1 && graph->special_dof[node_num] == PCBDDCGRAPH_NEUMANN_MARK)) {
149         printcc = PETSC_TRUE;
150       }
151       if (printcc) {
152         for (j=graph->cptr[i];j<graph->cptr[i+1];j++) {
153           ierr = PetscViewerASCIISynchronizedPrintf(viewer," %d (%d)",graph->queue[j],queue_in_global_numbering[j]);CHKERRQ(ierr);
154         }
155       }
156     } else {
157       ierr = PetscViewerASCIISynchronizedPrintf(viewer,")");CHKERRQ(ierr);
158     }
159     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");CHKERRQ(ierr);
160     ierr = PetscViewerASCIISetTab(viewer,tabs);CHKERRQ(ierr);
161     ierr = PetscViewerASCIIUseTabs(viewer,PETSC_TRUE);CHKERRQ(ierr);
162   }
163   ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr);
164   ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
165   PetscFunctionReturn(0);
166 }
167 
168 #undef __FUNCT__
169 #define __FUNCT__ "PCBDDCGraphRestoreCandidatesIS"
170 PetscErrorCode PCBDDCGraphRestoreCandidatesIS(PCBDDCGraph graph, PetscInt *n_faces, IS *FacesIS[], PetscInt *n_edges, IS *EdgesIS[], IS *VerticesIS)
171 {
172   PetscInt       i;
173   PetscErrorCode ierr;
174 
175   PetscFunctionBegin;
176   if (n_faces) {
177     if (FacesIS) {
178       for (i=0;i<*n_faces;i++) {
179         ierr = ISDestroy(&((*FacesIS)[i]));CHKERRQ(ierr);
180       }
181       ierr = PetscFree(*FacesIS);CHKERRQ(ierr);
182     }
183     *n_faces = 0;
184   }
185   if (n_edges) {
186     if (EdgesIS) {
187       for (i=0;i<*n_edges;i++) {
188         ierr = ISDestroy(&((*EdgesIS)[i]));CHKERRQ(ierr);
189       }
190       ierr = PetscFree(*EdgesIS);CHKERRQ(ierr);
191     }
192     *n_edges = 0;
193   }
194   if (VerticesIS) {
195     ierr = ISDestroy(VerticesIS);CHKERRQ(ierr);
196   }
197   PetscFunctionReturn(0);
198 }
199 
200 #undef __FUNCT__
201 #define __FUNCT__ "PCBDDCGraphGetCandidatesIS"
202 PetscErrorCode PCBDDCGraphGetCandidatesIS(PCBDDCGraph graph, PetscInt *n_faces, IS *FacesIS[], PetscInt *n_edges, IS *EdgesIS[], IS *VerticesIS)
203 {
204   IS             *ISForFaces,*ISForEdges,ISForVertices;
205   PetscInt       i,nfc,nec,nvc,*idx,*mark;
206   PetscErrorCode ierr;
207 
208   PetscFunctionBegin;
209   ierr = PetscCalloc1(graph->ncc,&mark);CHKERRQ(ierr);
210   /* loop on ccs to evalute number of faces, edges and vertices */
211   nfc = 0;
212   nec = 0;
213   nvc = 0;
214   for (i=0;i<graph->ncc;i++) {
215     PetscInt repdof = graph->queue[graph->cptr[i]];
216     if (graph->cptr[i+1]-graph->cptr[i] > graph->custom_minimal_size && graph->count[repdof] < graph->maxcount) {
217       if (!graph->twodim && graph->count[repdof] == 1 && graph->special_dof[repdof] != PCBDDCGRAPH_NEUMANN_MARK) {
218         nfc++;
219         mark[i] = 2;
220       } else {
221         nec++;
222         mark[i] = 1;
223       }
224     } else {
225       nvc += graph->cptr[i+1]-graph->cptr[i];
226     }
227   }
228 
229   /* allocate IS arrays for faces, edges. Vertices need a single index set. */
230   if (FacesIS) {
231     ierr = PetscMalloc1(nfc,&ISForFaces);CHKERRQ(ierr);
232   }
233   if (EdgesIS) {
234     ierr = PetscMalloc1(nec,&ISForEdges);CHKERRQ(ierr);
235   }
236   if (VerticesIS) {
237     ierr = PetscMalloc1(nvc,&idx);CHKERRQ(ierr);
238   }
239 
240   /* loop on ccs to compute index sets for faces and edges */
241   if (!graph->queue_sorted) {
242     PetscInt *queue_global;
243 
244     ierr = PetscMalloc1(graph->cptr[graph->ncc],&queue_global);CHKERRQ(ierr);
245     ierr = ISLocalToGlobalMappingApply(graph->l2gmap,graph->cptr[graph->ncc],graph->queue,queue_global);CHKERRQ(ierr);
246     for (i=0;i<graph->ncc;i++) {
247       ierr = PetscSortIntWithArray(graph->cptr[i+1]-graph->cptr[i],&queue_global[graph->cptr[i]],&graph->queue[graph->cptr[i]]);CHKERRQ(ierr);
248     }
249     ierr = PetscFree(queue_global);CHKERRQ(ierr);
250     graph->queue_sorted = PETSC_TRUE;
251   }
252   nfc = 0;
253   nec = 0;
254   for (i=0;i<graph->ncc;i++) {
255     if (mark[i] == 2) {
256       if (FacesIS) {
257         ierr = ISCreateGeneral(PETSC_COMM_SELF,graph->cptr[i+1]-graph->cptr[i],&graph->queue[graph->cptr[i]],PETSC_USE_POINTER,&ISForFaces[nfc]);CHKERRQ(ierr);
258       }
259       nfc++;
260     } else if (mark[i] == 1) {
261       if (EdgesIS) {
262         ierr = ISCreateGeneral(PETSC_COMM_SELF,graph->cptr[i+1]-graph->cptr[i],&graph->queue[graph->cptr[i]],PETSC_USE_POINTER,&ISForEdges[nec]);CHKERRQ(ierr);
263       }
264       nec++;
265     }
266   }
267 
268   /* index set for vertices */
269   if (VerticesIS) {
270     nvc = 0;
271     for (i=0;i<graph->ncc;i++) {
272       if (!mark[i]) {
273         PetscInt j;
274 
275         for (j=graph->cptr[i];j<graph->cptr[i+1];j++) {
276           idx[nvc]=graph->queue[j];
277           nvc++;
278         }
279       }
280     }
281     /* sort vertex set (by local ordering) */
282     ierr = PetscSortInt(nvc,idx);CHKERRQ(ierr);
283     ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,idx,PETSC_OWN_POINTER,&ISForVertices);CHKERRQ(ierr);
284   }
285   ierr = PetscFree(mark);CHKERRQ(ierr);
286 
287   /* get back info */
288   if (n_faces)       *n_faces = nfc;
289   if (FacesIS)       *FacesIS = ISForFaces;
290   if (n_edges)       *n_edges = nec;
291   if (EdgesIS)       *EdgesIS = ISForEdges;
292   if (VerticesIS) *VerticesIS = ISForVertices;
293   PetscFunctionReturn(0);
294 }
295 
296 #undef __FUNCT__
297 #define __FUNCT__ "PCBDDCGraphComputeConnectedComponents"
298 PetscErrorCode PCBDDCGraphComputeConnectedComponents(PCBDDCGraph graph)
299 {
300   PetscBool      adapt_interface_reduced;
301   MPI_Comm       interface_comm;
302   PetscMPIInt    size;
303   PetscInt       i;
304   PetscErrorCode ierr;
305 
306   PetscFunctionBegin;
307   /* compute connected components locally */
308   ierr = PetscObjectGetComm((PetscObject)(graph->l2gmap),&interface_comm);CHKERRQ(ierr);
309   ierr = PCBDDCGraphComputeConnectedComponentsLocal(graph);CHKERRQ(ierr);
310   /* check consistency of connected components among neighbouring subdomains -> it adapt them in case it is needed */
311   ierr = MPI_Comm_size(interface_comm,&size);CHKERRQ(ierr);
312   adapt_interface_reduced = PETSC_FALSE;
313   if (size > 1) {
314     PetscInt i;
315     PetscBool adapt_interface = PETSC_FALSE;
316     for (i=0;i<graph->n_subsets;i++) {
317       /* We are not sure that on a given subset of the local interface,
318          with two connected components, the latters be the same among sharing subdomains */
319       if (graph->subset_ncc[i] > 1) {
320         adapt_interface = PETSC_TRUE;
321         break;
322       }
323     }
324     ierr = MPIU_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_BOOL,MPI_LOR,interface_comm);CHKERRQ(ierr);
325   }
326 
327   if (graph->n_subsets && adapt_interface_reduced) {
328     PetscBT     subset_cc_adapt;
329     MPI_Request *send_requests,*recv_requests;
330     PetscInt    *send_buffer,*recv_buffer;
331     PetscInt    sum_requests,start_of_recv,start_of_send;
332     PetscInt    *cum_recv_counts;
333     PetscInt    *labels;
334     PetscInt    ncc,cum_queue,mss,mns,j,k,s;
335     PetscInt    **refine_buffer=NULL,*private_labels = NULL;
336 
337     ierr = PetscMalloc1(graph->nvtxs,&labels);CHKERRQ(ierr);
338     ierr = PetscMemzero(labels,graph->nvtxs*sizeof(*labels));CHKERRQ(ierr);
339     for (i=0;i<graph->ncc;i++)
340       for (j=graph->cptr[i];j<graph->cptr[i+1];j++)
341         labels[graph->queue[j]] = i;
342 
343     /* allocate some space */
344     ierr = PetscMalloc1(graph->n_subsets+1,&cum_recv_counts);CHKERRQ(ierr);
345     ierr = PetscMemzero(cum_recv_counts,(graph->n_subsets+1)*sizeof(*cum_recv_counts));CHKERRQ(ierr);
346 
347     /* first count how many neighbours per connected component I will receive from */
348     cum_recv_counts[0] = 0;
349     for (i=0;i<graph->n_subsets;i++) cum_recv_counts[i+1] = cum_recv_counts[i]+graph->count[graph->subset_idxs[i][0]];
350     ierr = PetscMalloc1(cum_recv_counts[graph->n_subsets],&recv_buffer);CHKERRQ(ierr);
351     ierr = PetscMalloc2(cum_recv_counts[graph->n_subsets],&send_requests,cum_recv_counts[graph->n_subsets],&recv_requests);CHKERRQ(ierr);
352     for (i=0;i<cum_recv_counts[graph->n_subsets];i++) {
353       send_requests[i] = MPI_REQUEST_NULL;
354       recv_requests[i] = MPI_REQUEST_NULL;
355     }
356 
357     /* exchange with my neighbours the number of my connected components on the subset of interface */
358     sum_requests = 0;
359     for (i=0;i<graph->n_subsets;i++) {
360       PetscMPIInt neigh,tag;
361       PetscInt    count,*neighs;
362 
363       count = graph->count[graph->subset_idxs[i][0]];
364       neighs = graph->neighbours_set[graph->subset_idxs[i][0]];
365       ierr = PetscMPIIntCast(2*graph->subset_ref_node[i],&tag);CHKERRQ(ierr);
366       for (k=0;k<count;k++) {
367         ierr = PetscMPIIntCast(neighs[k],&neigh);CHKERRQ(ierr);
368         ierr = MPI_Isend(&graph->subset_ncc[i],1,MPIU_INT,neigh,tag,interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
369         ierr = MPI_Irecv(&recv_buffer[sum_requests],1,MPIU_INT,neigh,tag,interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
370         sum_requests++;
371       }
372     }
373     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
374     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
375 
376     /* determine the subsets I have to adapt (those having more than 1 cc) */
377     ierr = PetscBTCreate(graph->n_subsets,&subset_cc_adapt);CHKERRQ(ierr);
378     ierr = PetscBTMemzero(graph->n_subsets,subset_cc_adapt);CHKERRQ(ierr);
379     for (i=0;i<graph->n_subsets;i++) {
380       if (graph->subset_ncc[i] > 1) {
381         ierr = PetscBTSet(subset_cc_adapt,i);CHKERRQ(ierr);
382         continue;
383       }
384       for (j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){
385          if (recv_buffer[j] > 1) {
386           ierr = PetscBTSet(subset_cc_adapt,i);CHKERRQ(ierr);
387           break;
388         }
389       }
390     }
391     ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
392 
393     /* determine send/recv buffers sizes */
394     j = 0;
395     mss = 0;
396     for (i=0;i<graph->n_subsets;i++) {
397       if (PetscBTLookup(subset_cc_adapt,i)) {
398         j += graph->subset_size[i];
399         mss = PetscMax(graph->subset_size[i],mss);
400       }
401     }
402     k = 0;
403     mns = 0;
404     for (i=0;i<graph->n_subsets;i++) {
405       if (PetscBTLookup(subset_cc_adapt,i)) {
406         k += (cum_recv_counts[i+1]-cum_recv_counts[i])*graph->subset_size[i];
407         mns = PetscMax(cum_recv_counts[i+1]-cum_recv_counts[i],mns);
408       }
409     }
410     ierr = PetscMalloc2(j,&send_buffer,k,&recv_buffer);CHKERRQ(ierr);
411 
412     /* fill send buffer (order matters: subset_idxs ordered by global ordering) */
413     j = 0;
414     for (i=0;i<graph->n_subsets;i++)
415       if (PetscBTLookup(subset_cc_adapt,i))
416         for (k=0;k<graph->subset_size[i];k++)
417           send_buffer[j++] = labels[graph->subset_idxs[i][k]];
418 
419     /* now exchange the data */
420     start_of_recv = 0;
421     start_of_send = 0;
422     sum_requests = 0;
423     for (i=0;i<graph->n_subsets;i++) {
424       if (PetscBTLookup(subset_cc_adapt,i)) {
425         PetscMPIInt neigh,tag;
426         PetscInt    size_of_send = graph->subset_size[i];
427 
428         j = graph->subset_idxs[i][0];
429         ierr = PetscMPIIntCast(2*graph->subset_ref_node[i]+1,&tag);CHKERRQ(ierr);
430         for (k=0;k<graph->count[j];k++) {
431           ierr = PetscMPIIntCast(graph->neighbours_set[j][k],&neigh);CHKERRQ(ierr);
432           ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,neigh,tag,interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
433           ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_send,MPIU_INT,neigh,tag,interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
434           start_of_recv += size_of_send;
435           sum_requests++;
436         }
437         start_of_send += size_of_send;
438       }
439     }
440     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
441 
442     /* refine connected components */
443     start_of_recv = 0;
444     /* allocate some temporary space */
445     if (mss) {
446       ierr = PetscMalloc1(mss,&refine_buffer);CHKERRQ(ierr);
447       ierr = PetscMalloc2(mss*(mns+1),&refine_buffer[0],mss,&private_labels);CHKERRQ(ierr);
448     }
449     ncc = 0;
450     cum_queue = 0;
451     graph->cptr[0] = 0;
452     for (i=0;i<graph->n_subsets;i++) {
453       if (PetscBTLookup(subset_cc_adapt,i)) {
454         PetscInt subset_counter = 0;
455         PetscInt sharingprocs = cum_recv_counts[i+1]-cum_recv_counts[i]+1; /* count myself */
456         PetscInt buffer_size = graph->subset_size[i];
457 
458         /* compute pointers */
459         for (j=1;j<buffer_size;j++) refine_buffer[j] = refine_buffer[j-1] + sharingprocs;
460         /* analyze contributions from subdomains that share the i-th subset
461            The stricture of refine_buffer is suitable to find intersections of ccs among sharingprocs.
462            supposing the current subset is shared by 3 processes and has dimension 5 with global dofs 0,1,2,3,4 (local 0,4,3,1,2)
463            sharing procs connected components:
464              neigh 0: [0 1 4], [2 3], labels [4,7]  (2 connected components)
465              neigh 1: [0 1], [2 3 4], labels [3 2]  (2 connected components)
466              neigh 2: [0 4], [1], [2 3], labels [1 5 6] (3 connected components)
467            refine_buffer will be filled as:
468              [ 4, 3, 1;
469                4, 2, 1;
470                7, 2, 6;
471                4, 3, 5;
472                7, 2, 6; ];
473            The connected components in local ordering are [0], [1], [2 3], [4] */
474         /* fill temp_buffer */
475         for (k=0;k<buffer_size;k++) refine_buffer[k][0] = labels[graph->subset_idxs[i][k]];
476         for (j=0;j<sharingprocs-1;j++) {
477           for (k=0;k<buffer_size;k++) refine_buffer[k][j+1] = recv_buffer[start_of_recv+k];
478           start_of_recv += buffer_size;
479         }
480         ierr = PetscMemzero(private_labels,buffer_size*sizeof(PetscInt));CHKERRQ(ierr);
481         for (j=0;j<buffer_size;j++) {
482           if (!private_labels[j]) { /* found a new cc  */
483             PetscBool same_set;
484 
485             graph->cptr[ncc] = cum_queue;
486             ncc++;
487             subset_counter++;
488             private_labels[j] = subset_counter;
489             graph->queue[cum_queue++] = graph->subset_idxs[i][j];
490             for (k=j+1;k<buffer_size;k++) { /* check for other nodes in new cc */
491               same_set = PETSC_TRUE;
492               for (s=0;s<sharingprocs;s++) {
493                 if (refine_buffer[j][s] != refine_buffer[k][s]) {
494                   same_set = PETSC_FALSE;
495                   break;
496                 }
497               }
498               if (same_set) {
499                 private_labels[k] = subset_counter;
500                 graph->queue[cum_queue++] = graph->subset_idxs[i][k];
501               }
502             }
503           }
504         }
505         graph->cptr[ncc] = cum_queue;
506         graph->subset_ncc[i] = subset_counter;
507         graph->queue_sorted = PETSC_FALSE;
508       } else { /* this subset does not need to be adapted */
509         ierr = PetscMemcpy(graph->queue+cum_queue,graph->subset_idxs[i],graph->subset_size[i]*sizeof(PetscInt));CHKERRQ(ierr);
510         ncc++;
511         cum_queue += graph->subset_size[i];
512         graph->cptr[ncc] = cum_queue;
513       }
514     }
515     graph->cptr[ncc] = cum_queue;
516     graph->ncc = ncc;
517     if (mss) {
518       ierr = PetscFree2(refine_buffer[0],private_labels);CHKERRQ(ierr);
519       ierr = PetscFree(refine_buffer);CHKERRQ(ierr);
520     }
521     ierr = PetscFree(labels);CHKERRQ(ierr);
522     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
523     ierr = PetscFree2(send_requests,recv_requests);CHKERRQ(ierr);
524     ierr = PetscFree2(send_buffer,recv_buffer);CHKERRQ(ierr);
525     ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr);
526     ierr = PetscBTDestroy(&subset_cc_adapt);CHKERRQ(ierr);
527   }
528 
529   /* Determine if we are in 2D or 3D */
530   if (!graph->twodimset) {
531     PetscBool twodim = PETSC_TRUE;
532     for (i=0;i<graph->ncc;i++) {
533       PetscInt repdof = graph->queue[graph->cptr[i]];
534       PetscInt ccsize = graph->cptr[i+1]-graph->cptr[i];
535       if (graph->count[repdof] > 1 && ccsize > graph->custom_minimal_size) {
536         twodim = PETSC_FALSE;
537         break;
538       }
539     }
540     ierr = MPIU_Allreduce(&twodim,&graph->twodim,1,MPIU_BOOL,MPI_LAND,PetscObjectComm((PetscObject)graph->l2gmap));CHKERRQ(ierr);
541     graph->twodimset = PETSC_TRUE;
542   }
543   PetscFunctionReturn(0);
544 }
545 
546 
547 #undef __FUNCT__
548 #define __FUNCT__ "PCBDDCGraphComputeCC_Private"
549 PETSC_STATIC_INLINE PetscErrorCode PCBDDCGraphComputeCC_Private(PCBDDCGraph graph,PetscInt pid,PetscInt* queue_tip,PetscInt n_prev,PetscInt* n_added)
550 {
551   PetscInt       i,j,n;
552   PetscInt       *xadj = graph->xadj,*adjncy = graph->adjncy;
553   PetscBT        touched = graph->touched;
554   PetscBool      havecsr = (PetscBool)(!!xadj);
555   PetscBool      havesubs = (PetscBool)(!!graph->n_local_subs);
556   PetscErrorCode ierr;
557 
558   PetscFunctionBegin;
559   n = 0;
560   if (havecsr && !havesubs) {
561     for (i=-n_prev;i<0;i++) {
562       PetscInt start_dof = queue_tip[i];
563       /* we assume that if a dof has a size 1 adjacency list and the corresponding entry is negative, it is connected to all dofs */
564       if (xadj[start_dof+1]-xadj[start_dof] == 1 && adjncy[xadj[start_dof]] < 0) {
565         for (j=0;j<graph->subset_size[pid-1];j++) { /* pid \in [1,graph->n_subsets] */
566           PetscInt dof = graph->subset_idxs[pid-1][j];
567           if (!PetscBTLookup(touched,dof) && graph->subset[dof] == pid) {
568             ierr = PetscBTSet(touched,dof);CHKERRQ(ierr);
569             queue_tip[n] = dof;
570             n++;
571           }
572         }
573       } else {
574         for (j=xadj[start_dof];j<xadj[start_dof+1];j++) {
575           PetscInt dof = adjncy[j];
576           if (!PetscBTLookup(touched,dof) && graph->subset[dof] == pid) {
577             ierr = PetscBTSet(touched,dof);CHKERRQ(ierr);
578             queue_tip[n] = dof;
579             n++;
580           }
581         }
582       }
583     }
584   } else if (havecsr && havesubs) {
585     PetscInt sid = graph->local_subs[queue_tip[-n_prev]];
586     for (i=-n_prev;i<0;i++) {
587       PetscInt start_dof = queue_tip[i];
588       /* we assume that if a dof has a size 1 adjacency list and the corresponding entry is negative, it is connected to all dofs belonging to the local sub */
589       if (xadj[start_dof+1]-xadj[start_dof] == 1 && adjncy[xadj[start_dof]] < 0) {
590         for (j=0;j<graph->subset_size[pid-1];j++) { /* pid \in [1,graph->n_subsets] */
591           PetscInt dof = graph->subset_idxs[pid-1][j];
592           if (!PetscBTLookup(touched,dof) && graph->subset[dof] == pid && graph->local_subs[dof] == sid) {
593             ierr = PetscBTSet(touched,dof);CHKERRQ(ierr);
594             queue_tip[n] = dof;
595             n++;
596           }
597         }
598       } else {
599         for (j=xadj[start_dof];j<xadj[start_dof+1];j++) {
600           PetscInt dof = adjncy[j];
601           if (!PetscBTLookup(touched,dof) && graph->subset[dof] == pid && graph->local_subs[dof] == sid) {
602             ierr = PetscBTSet(touched,dof);CHKERRQ(ierr);
603             queue_tip[n] = dof;
604             n++;
605           }
606         }
607       }
608     }
609   } else { /* sub info only */
610     PetscInt sid = graph->local_subs[queue_tip[-n_prev]];
611     for (j=0;j<graph->subset_size[pid-1];j++) { /* pid \in [1,graph->n_subsets] */
612       PetscInt dof = graph->subset_idxs[pid-1][j];
613       if (!PetscBTLookup(touched,dof) && graph->subset[dof] == pid && graph->local_subs[dof] == sid) {
614         ierr = PetscBTSet(touched,dof);CHKERRQ(ierr);
615         queue_tip[n] = dof;
616         n++;
617       }
618     }
619   }
620   *n_added = n;
621   PetscFunctionReturn(0);
622 }
623 
624 #undef __FUNCT__
625 #define __FUNCT__ "PCBDDCGraphComputeConnectedComponentsLocal"
626 PetscErrorCode PCBDDCGraphComputeConnectedComponentsLocal(PCBDDCGraph graph)
627 {
628   PetscInt       ncc,cum_queue,n;
629   PetscMPIInt    commsize;
630   PetscErrorCode ierr;
631 
632   PetscFunctionBegin;
633   if (!graph->setupcalled) SETERRQ(PetscObjectComm((PetscObject)graph->l2gmap),PETSC_ERR_ORDER,"PCBDDCGraphSetUp should be called first");
634   /* quiet return if there isn't any local info */
635   if (!graph->xadj && !graph->n_local_subs) {
636     PetscFunctionReturn(0);
637   }
638 
639   /* reset any previous search of connected components */
640   ierr = PetscBTMemzero(graph->nvtxs,graph->touched);CHKERRQ(ierr);
641   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)graph->l2gmap),&commsize);CHKERRQ(ierr);
642   if (commsize > graph->commsizelimit) {
643     PetscInt i;
644     for (i=0;i<graph->nvtxs;i++) {
645       if (graph->special_dof[i] == PCBDDCGRAPH_DIRICHLET_MARK || !graph->count[i]) {
646         ierr = PetscBTSet(graph->touched,i);CHKERRQ(ierr);
647       }
648     }
649   }
650 
651   /* begin search for connected components */
652   cum_queue = 0;
653   ncc = 0;
654   for (n=0;n<graph->n_subsets;n++) {
655     PetscInt pid = n+1;  /* partition labeled by 0 is discarded */
656     PetscInt found = 0,prev = 0,first = 0,ncc_pid = 0;
657     while (found != graph->subset_size[n]) {
658       PetscInt added = 0;
659       if (!prev) { /* search for new starting dof */
660         while (PetscBTLookup(graph->touched,graph->subset_idxs[n][first])) first++;
661         ierr = PetscBTSet(graph->touched,graph->subset_idxs[n][first]);CHKERRQ(ierr);
662         graph->queue[cum_queue] = graph->subset_idxs[n][first];
663         graph->cptr[ncc] = cum_queue;
664         prev = 1;
665         cum_queue++;
666         found++;
667         ncc_pid++;
668         ncc++;
669       }
670       ierr = PCBDDCGraphComputeCC_Private(graph,pid,graph->queue + cum_queue,prev,&added);CHKERRQ(ierr);
671       if (!added) {
672         graph->subset_ncc[n] = ncc_pid;
673         graph->cptr[ncc] = cum_queue;
674       }
675       prev = added;
676       found += added;
677       cum_queue += added;
678       if (added && found == graph->subset_size[n]) {
679         graph->subset_ncc[n] = ncc_pid;
680         graph->cptr[ncc] = cum_queue;
681       }
682     }
683   }
684   graph->ncc = ncc;
685   graph->queue_sorted = PETSC_FALSE;
686   PetscFunctionReturn(0);
687 }
688 
689 #undef __FUNCT__
690 #define __FUNCT__ "PCBDDCGraphSetUp"
691 PetscErrorCode PCBDDCGraphSetUp(PCBDDCGraph graph, PetscInt custom_minimal_size, IS neumann_is, IS dirichlet_is, PetscInt n_ISForDofs, IS ISForDofs[], IS custom_primal_vertices)
692 {
693   IS             subset,subset_n;
694   MPI_Comm       comm;
695   const PetscInt *is_indices;
696   PetscInt       n_neigh,*neigh,*n_shared,**shared,*queue_global;
697   PetscInt       i,j,k,s,total_counts,nodes_touched,is_size;
698   PetscMPIInt    commsize;
699   PetscBool      same_set,mirrors_found;
700   PetscErrorCode ierr;
701 
702   PetscFunctionBegin;
703   PetscValidLogicalCollectiveInt(graph->l2gmap,custom_minimal_size,2);
704   if (neumann_is) {
705     PetscValidHeaderSpecific(neumann_is,IS_CLASSID,3);
706     PetscCheckSameComm(graph->l2gmap,1,neumann_is,3);
707   }
708   graph->has_dirichlet = PETSC_FALSE;
709   if (dirichlet_is) {
710     PetscValidHeaderSpecific(dirichlet_is,IS_CLASSID,4);
711     PetscCheckSameComm(graph->l2gmap,1,dirichlet_is,4);
712     graph->has_dirichlet = PETSC_TRUE;
713   }
714   PetscValidLogicalCollectiveInt(graph->l2gmap,n_ISForDofs,5);
715   for (i=0;i<n_ISForDofs;i++) {
716     PetscValidHeaderSpecific(ISForDofs[i],IS_CLASSID,6);
717     PetscCheckSameComm(graph->l2gmap,1,ISForDofs[i],6);
718   }
719   if (custom_primal_vertices) {
720     PetscValidHeaderSpecific(custom_primal_vertices,IS_CLASSID,6);
721     PetscCheckSameComm(graph->l2gmap,1,custom_primal_vertices,7);
722   }
723   ierr = PetscObjectGetComm((PetscObject)(graph->l2gmap),&comm);CHKERRQ(ierr);
724   ierr = MPI_Comm_size(comm,&commsize);CHKERRQ(ierr);
725 
726   /* custom_minimal_size */
727   graph->custom_minimal_size = custom_minimal_size;
728   /* get info l2gmap and allocate work vectors  */
729   ierr = ISLocalToGlobalMappingGetInfo(graph->l2gmap,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr);
730   /* check if we have any local periodic nodes (periodic BCs) */
731   mirrors_found = PETSC_FALSE;
732   if (graph->nvtxs && n_neigh) {
733     for (i=0; i<n_shared[0]; i++) graph->count[shared[0][i]] += 1;
734     for (i=0; i<n_shared[0]; i++) {
735       if (graph->count[shared[0][i]] > 1) {
736         mirrors_found = PETSC_TRUE;
737         break;
738       }
739     }
740   }
741   /* compute local mirrors (if any) */
742   if (mirrors_found) {
743     IS       to,from;
744     PetscInt *local_indices,*global_indices;
745 
746     ierr = ISCreateStride(PETSC_COMM_SELF,graph->nvtxs,0,1,&to);CHKERRQ(ierr);
747     ierr = ISLocalToGlobalMappingApplyIS(graph->l2gmap,to,&from);CHKERRQ(ierr);
748     /* get arrays of local and global indices */
749     ierr = PetscMalloc1(graph->nvtxs,&local_indices);CHKERRQ(ierr);
750     ierr = ISGetIndices(to,(const PetscInt**)&is_indices);CHKERRQ(ierr);
751     ierr = PetscMemcpy(local_indices,is_indices,graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
752     ierr = ISRestoreIndices(to,(const PetscInt**)&is_indices);CHKERRQ(ierr);
753     ierr = PetscMalloc1(graph->nvtxs,&global_indices);CHKERRQ(ierr);
754     ierr = ISGetIndices(from,(const PetscInt**)&is_indices);CHKERRQ(ierr);
755     ierr = PetscMemcpy(global_indices,is_indices,graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
756     ierr = ISRestoreIndices(from,(const PetscInt**)&is_indices);CHKERRQ(ierr);
757     /* allocate space for mirrors */
758     ierr = PetscMalloc2(graph->nvtxs,&graph->mirrors,graph->nvtxs,&graph->mirrors_set);CHKERRQ(ierr);
759     ierr = PetscMemzero(graph->mirrors,graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
760     graph->mirrors_set[0] = 0;
761 
762     k=0;
763     for (i=0;i<n_shared[0];i++) {
764       j=shared[0][i];
765       if (graph->count[j] > 1) {
766         graph->mirrors[j]++;
767         k++;
768       }
769     }
770     /* allocate space for set of mirrors */
771     ierr = PetscMalloc1(k,&graph->mirrors_set[0]);CHKERRQ(ierr);
772     for (i=1;i<graph->nvtxs;i++)
773       graph->mirrors_set[i]=graph->mirrors_set[i-1]+graph->mirrors[i-1];
774 
775     /* fill arrays */
776     ierr = PetscMemzero(graph->mirrors,graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
777     for (j=0;j<n_shared[0];j++) {
778       i=shared[0][j];
779       if (graph->count[i] > 1)
780         graph->mirrors_set[i][graph->mirrors[i]++]=global_indices[i];
781     }
782     ierr = PetscSortIntWithArray(graph->nvtxs,global_indices,local_indices);CHKERRQ(ierr);
783     for (i=0;i<graph->nvtxs;i++) {
784       if (graph->mirrors[i] > 0) {
785         ierr = PetscFindInt(graph->mirrors_set[i][0],graph->nvtxs,global_indices,&k);CHKERRQ(ierr);
786         j = global_indices[k];
787         while ( k > 0 && global_indices[k-1] == j) k--;
788         for (j=0;j<graph->mirrors[i];j++) {
789           graph->mirrors_set[i][j]=local_indices[k+j];
790         }
791         ierr = PetscSortInt(graph->mirrors[i],graph->mirrors_set[i]);CHKERRQ(ierr);
792       }
793     }
794     ierr = PetscFree(local_indices);CHKERRQ(ierr);
795     ierr = PetscFree(global_indices);CHKERRQ(ierr);
796     ierr = ISDestroy(&to);CHKERRQ(ierr);
797     ierr = ISDestroy(&from);CHKERRQ(ierr);
798   }
799   ierr = PetscMemzero(graph->count,graph->nvtxs*sizeof(*graph->count));CHKERRQ(ierr);
800 
801   /* Count total number of neigh per node */
802   k = 0;
803   for (i=1;i<n_neigh;i++) {
804     k += n_shared[i];
805     for (j=0;j<n_shared[i];j++) {
806       graph->count[shared[i][j]] += 1;
807     }
808   }
809   /* Allocate space for storing the set of neighbours for each node */
810   if (graph->nvtxs) {
811     ierr = PetscMalloc1(k,&graph->neighbours_set[0]);CHKERRQ(ierr);
812   }
813   for (i=1;i<graph->nvtxs;i++) { /* dont count myself */
814     graph->neighbours_set[i]=graph->neighbours_set[i-1]+graph->count[i-1];
815   }
816   /* Get information for sharing subdomains */
817   ierr = PetscMemzero(graph->count,graph->nvtxs*sizeof(*graph->count));CHKERRQ(ierr);
818   for (i=1;i<n_neigh;i++) { /* dont count myself */
819     s = n_shared[i];
820     for (j=0;j<s;j++) {
821       k = shared[i][j];
822       graph->neighbours_set[k][graph->count[k]] = neigh[i];
823       graph->count[k] += 1;
824     }
825   }
826   /* sort set of sharing subdomains */
827   for (i=0;i<graph->nvtxs;i++) {
828     ierr = PetscSortRemoveDupsInt(&graph->count[i],graph->neighbours_set[i]);CHKERRQ(ierr);
829   }
830   /* free memory allocated by ISLocalToGlobalMappingGetInfo */
831   ierr = ISLocalToGlobalMappingRestoreInfo(graph->l2gmap,&n_neigh,&neigh,&n_shared,&shared);CHKERRQ(ierr);
832 
833   /*
834      Get info for dofs splitting
835      User can specify just a subset; an additional field is considered as a complementary field
836   */
837   for (i=0;i<graph->nvtxs;i++) graph->which_dof[i] = n_ISForDofs; /* by default a dof belongs to the complement set */
838   for (i=0;i<n_ISForDofs;i++) {
839     ierr = ISGetLocalSize(ISForDofs[i],&is_size);CHKERRQ(ierr);
840     ierr = ISGetIndices(ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
841     for (j=0;j<is_size;j++) {
842       if (is_indices[j] > -1 && is_indices[j] < graph->nvtxs) { /* out of bounds indices (if any) are skipped */
843         graph->which_dof[is_indices[j]] = i;
844       }
845     }
846     ierr = ISRestoreIndices(ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
847   }
848 
849   /* Take into account Neumann nodes */
850   if (neumann_is) {
851     ierr = ISGetLocalSize(neumann_is,&is_size);CHKERRQ(ierr);
852     ierr = ISGetIndices(neumann_is,(const PetscInt**)&is_indices);CHKERRQ(ierr);
853     for (i=0;i<is_size;i++) {
854       if (is_indices[i] > -1 && is_indices[i] < graph->nvtxs) { /* out of bounds indices (if any) are skipped */
855         graph->special_dof[is_indices[i]] = PCBDDCGRAPH_NEUMANN_MARK;
856       }
857     }
858     ierr = ISRestoreIndices(neumann_is,(const PetscInt**)&is_indices);CHKERRQ(ierr);
859   }
860   /* Take into account Dirichlet nodes (they overwrite any neumann boundary mark previously set) */
861   if (dirichlet_is) {
862     ierr = ISGetLocalSize(dirichlet_is,&is_size);CHKERRQ(ierr);
863     ierr = ISGetIndices(dirichlet_is,(const PetscInt**)&is_indices);CHKERRQ(ierr);
864     for (i=0;i<is_size;i++){
865       if (is_indices[i] > -1 && is_indices[i] < graph->nvtxs) { /* out of bounds indices (if any) are skipped */
866         if (commsize > graph->commsizelimit) { /* dirichlet nodes treated as internal */
867           ierr = PetscBTSet(graph->touched,is_indices[i]);CHKERRQ(ierr);
868           graph->subset[is_indices[i]] = 0;
869         }
870         graph->special_dof[is_indices[i]] = PCBDDCGRAPH_DIRICHLET_MARK;
871       }
872     }
873     ierr = ISRestoreIndices(dirichlet_is,(const PetscInt**)&is_indices);CHKERRQ(ierr);
874   }
875   /* mark local periodic nodes (if any) and adapt CSR graph (if any) */
876   if (graph->mirrors) {
877     for (i=0;i<graph->nvtxs;i++)
878       if (graph->mirrors[i])
879         graph->special_dof[i] = PCBDDCGRAPH_LOCAL_PERIODIC_MARK;
880 
881     if (graph->xadj) {
882       PetscInt *new_xadj,*new_adjncy;
883       /* sort CSR graph */
884       for (i=0;i<graph->nvtxs;i++)
885         ierr = PetscSortInt(graph->xadj[i+1]-graph->xadj[i],&graph->adjncy[graph->xadj[i]]);CHKERRQ(ierr);
886 
887       /* adapt local CSR graph in case of local periodicity */
888       k = 0;
889       for (i=0;i<graph->nvtxs;i++)
890         for (j=graph->xadj[i];j<graph->xadj[i+1];j++)
891           k += graph->mirrors[graph->adjncy[j]];
892 
893       ierr = PetscMalloc1(graph->nvtxs+1,&new_xadj);CHKERRQ(ierr);
894       ierr = PetscMalloc1(k+graph->xadj[graph->nvtxs],&new_adjncy);CHKERRQ(ierr);
895       new_xadj[0] = 0;
896       for (i=0;i<graph->nvtxs;i++) {
897         k = graph->xadj[i+1]-graph->xadj[i];
898         ierr = PetscMemcpy(&new_adjncy[new_xadj[i]],&graph->adjncy[graph->xadj[i]],k*sizeof(PetscInt));CHKERRQ(ierr);
899         new_xadj[i+1] = new_xadj[i]+k;
900         for (j=graph->xadj[i];j<graph->xadj[i+1];j++) {
901           k = graph->mirrors[graph->adjncy[j]];
902           ierr = PetscMemcpy(&new_adjncy[new_xadj[i+1]],graph->mirrors_set[graph->adjncy[j]],k*sizeof(PetscInt));CHKERRQ(ierr);
903           new_xadj[i+1] += k;
904         }
905         k = new_xadj[i+1]-new_xadj[i];
906         ierr = PetscSortRemoveDupsInt(&k,&new_adjncy[new_xadj[i]]);CHKERRQ(ierr);
907         new_xadj[i+1] = new_xadj[i]+k;
908       }
909       /* set new CSR into graph */
910       ierr = PetscFree(graph->xadj);CHKERRQ(ierr);
911       ierr = PetscFree(graph->adjncy);CHKERRQ(ierr);
912       graph->xadj = new_xadj;
913       graph->adjncy = new_adjncy;
914     }
915   }
916 
917   /* mark special nodes (if any) -> each will become a single node equivalence class */
918   if (custom_primal_vertices) {
919     ierr = ISGetLocalSize(custom_primal_vertices,&is_size);CHKERRQ(ierr);
920     ierr = ISGetIndices(custom_primal_vertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
921     for (i=0,j=0;i<is_size;i++){
922       if (is_indices[i] > -1 && is_indices[i] < graph->nvtxs  && graph->special_dof[is_indices[i]] != PCBDDCGRAPH_DIRICHLET_MARK) { /* out of bounds indices (if any) are skipped */
923         graph->special_dof[is_indices[i]] = PCBDDCGRAPH_SPECIAL_MARK-j;
924         j++;
925       }
926     }
927     ierr = ISRestoreIndices(custom_primal_vertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
928   }
929 
930   /* mark interior nodes (if commsize > graph->commsizelimit) as touched and belonging to partition number 0 */
931   if (commsize > graph->commsizelimit) {
932     for (i=0;i<graph->nvtxs;i++) {
933       if (!graph->count[i]) {
934         ierr = PetscBTSet(graph->touched,i);CHKERRQ(ierr);
935         graph->subset[i] = 0;
936       }
937     }
938   }
939 
940   /* init graph structure and compute default subsets */
941   nodes_touched = 0;
942   for (i=0;i<graph->nvtxs;i++) {
943     if (PetscBTLookup(graph->touched,i)) {
944       nodes_touched++;
945     }
946   }
947   i = 0;
948   graph->ncc = 0;
949   total_counts = 0;
950 
951   /* allocated space for queues */
952   if (commsize == graph->commsizelimit) {
953     ierr = PetscMalloc2(graph->nvtxs+1,&graph->cptr,graph->nvtxs,&graph->queue);CHKERRQ(ierr);
954   } else {
955     PetscInt nused = graph->nvtxs - nodes_touched;
956     ierr = PetscMalloc2(nused+1,&graph->cptr,nused,&graph->queue);CHKERRQ(ierr);
957   }
958 
959   while (nodes_touched<graph->nvtxs) {
960     /*  find first untouched node in local ordering */
961     while (PetscBTLookup(graph->touched,i)) i++;
962     ierr = PetscBTSet(graph->touched,i);CHKERRQ(ierr);
963     graph->subset[i] = graph->ncc+1;
964     graph->cptr[graph->ncc] = total_counts;
965     graph->queue[total_counts] = i;
966     total_counts++;
967     nodes_touched++;
968     /* now find all other nodes having the same set of sharing subdomains */
969     for (j=i+1;j<graph->nvtxs;j++) {
970       /* check for same number of sharing subdomains, dof number and same special mark */
971       if (!PetscBTLookup(graph->touched,j) && graph->count[i] == graph->count[j] && graph->which_dof[i] == graph->which_dof[j] && graph->special_dof[i] == graph->special_dof[j]) {
972         /* check for same set of sharing subdomains */
973         same_set = PETSC_TRUE;
974         for (k=0;k<graph->count[j];k++){
975           if (graph->neighbours_set[i][k] != graph->neighbours_set[j][k]) {
976             same_set = PETSC_FALSE;
977           }
978         }
979         /* I found a friend of mine */
980         if (same_set) {
981           ierr = PetscBTSet(graph->touched,j);CHKERRQ(ierr);
982           graph->subset[j] = graph->ncc+1;
983           nodes_touched++;
984           graph->queue[total_counts] = j;
985           total_counts++;
986         }
987       }
988     }
989     graph->ncc++;
990   }
991   /* set default number of subsets (at this point no info on csr and/or local_subs has been taken into account, so n_subsets = ncc */
992   graph->n_subsets = graph->ncc;
993   ierr = PetscMalloc1(graph->n_subsets,&graph->subset_ncc);CHKERRQ(ierr);
994   for (i=0;i<graph->n_subsets;i++) {
995     graph->subset_ncc[i] = 1;
996   }
997   /* final pointer */
998   graph->cptr[graph->ncc] = total_counts;
999 
1000   /* For consistency reasons (among neighbours), I need to sort (by global ordering) each connected component */
1001   /* Get a reference node (min index in global ordering) for each subset for tagging messages */
1002   ierr = PetscMalloc1(graph->ncc,&graph->subset_ref_node);CHKERRQ(ierr);
1003   ierr = PetscMalloc1(graph->cptr[graph->ncc],&queue_global);CHKERRQ(ierr);
1004   ierr = ISLocalToGlobalMappingApply(graph->l2gmap,graph->cptr[graph->ncc],graph->queue,queue_global);CHKERRQ(ierr);
1005   for (j=0;j<graph->ncc;j++) {
1006     ierr = PetscSortIntWithArray(graph->cptr[j+1]-graph->cptr[j],&queue_global[graph->cptr[j]],&graph->queue[graph->cptr[j]]);CHKERRQ(ierr);
1007     graph->subset_ref_node[j] = graph->queue[graph->cptr[j]];
1008   }
1009   ierr = PetscFree(queue_global);CHKERRQ(ierr);
1010   graph->queue_sorted = PETSC_TRUE;
1011 
1012   /* save information on subsets (needed when analyzing the connected components) */
1013   if (graph->ncc) {
1014     ierr = PetscMalloc2(graph->ncc,&graph->subset_size,graph->ncc,&graph->subset_idxs);CHKERRQ(ierr);
1015     ierr = PetscMalloc1(graph->cptr[graph->ncc],&graph->subset_idxs[0]);CHKERRQ(ierr);
1016     ierr = PetscMemzero(graph->subset_idxs[0],graph->cptr[graph->ncc]*sizeof(PetscInt));CHKERRQ(ierr);
1017     for (j=1;j<graph->ncc;j++) {
1018       graph->subset_size[j-1] = graph->cptr[j] - graph->cptr[j-1];
1019       graph->subset_idxs[j] = graph->subset_idxs[j-1] + graph->subset_size[j-1];
1020     }
1021     graph->subset_size[graph->ncc-1] = graph->cptr[graph->ncc] - graph->cptr[graph->ncc-1];
1022     ierr = PetscMemcpy(graph->subset_idxs[0],graph->queue,graph->cptr[graph->ncc]*sizeof(PetscInt));CHKERRQ(ierr);
1023   }
1024 
1025   /* renumber reference nodes */
1026   ierr = ISCreateGeneral(PetscObjectComm((PetscObject)(graph->l2gmap)),graph->ncc,graph->subset_ref_node,PETSC_COPY_VALUES,&subset_n);CHKERRQ(ierr);
1027   ierr = ISLocalToGlobalMappingApplyIS(graph->l2gmap,subset_n,&subset);CHKERRQ(ierr);
1028   ierr = ISDestroy(&subset_n);CHKERRQ(ierr);
1029   ierr = ISRenumber(subset,NULL,NULL,&subset_n);CHKERRQ(ierr);
1030   ierr = ISDestroy(&subset);CHKERRQ(ierr);
1031   ierr = ISGetLocalSize(subset_n,&k);CHKERRQ(ierr);
1032   if (k != graph->ncc) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Invalid size of new subset! %D != %D",k,graph->ncc);
1033   ierr = ISGetIndices(subset_n,&is_indices);CHKERRQ(ierr);
1034   ierr = PetscMemcpy(graph->subset_ref_node,is_indices,graph->ncc*sizeof(PetscInt));CHKERRQ(ierr);
1035   ierr = ISRestoreIndices(subset_n,&is_indices);CHKERRQ(ierr);
1036   ierr = ISDestroy(&subset_n);CHKERRQ(ierr);
1037 
1038   /* free workspace */
1039   graph->setupcalled = PETSC_TRUE;
1040   PetscFunctionReturn(0);
1041 }
1042 
1043 #undef __FUNCT__
1044 #define __FUNCT__ "PCBDDCGraphResetCSR"
1045 PetscErrorCode PCBDDCGraphResetCSR(PCBDDCGraph graph)
1046 {
1047   PetscErrorCode ierr;
1048 
1049   PetscFunctionBegin;
1050   if (!graph) PetscFunctionReturn(0);
1051   if (graph->freecsr) {
1052     ierr = PetscFree(graph->xadj);CHKERRQ(ierr);
1053     ierr = PetscFree(graph->adjncy);CHKERRQ(ierr);
1054   } else {
1055     graph->xadj = NULL;
1056     graph->adjncy = NULL;
1057   }
1058   graph->freecsr = PETSC_FALSE;
1059   graph->nvtxs_csr = 0;
1060   PetscFunctionReturn(0);
1061 }
1062 
1063 #undef __FUNCT__
1064 #define __FUNCT__ "PCBDDCGraphReset"
1065 PetscErrorCode PCBDDCGraphReset(PCBDDCGraph graph)
1066 {
1067   PetscErrorCode ierr;
1068 
1069   PetscFunctionBegin;
1070   if (!graph) PetscFunctionReturn(0);
1071   ierr = ISLocalToGlobalMappingDestroy(&graph->l2gmap);CHKERRQ(ierr);
1072   ierr = PetscFree(graph->subset_ncc);CHKERRQ(ierr);
1073   ierr = PetscFree(graph->subset_ref_node);CHKERRQ(ierr);
1074   if (graph->nvtxs) {
1075     ierr = PetscFree(graph->neighbours_set[0]);CHKERRQ(ierr);
1076   }
1077   ierr = PetscBTDestroy(&graph->touched);CHKERRQ(ierr);
1078   ierr = PetscFree5(graph->count,
1079                     graph->neighbours_set,
1080                     graph->subset,
1081                     graph->which_dof,
1082                     graph->special_dof);CHKERRQ(ierr);
1083   ierr = PetscFree2(graph->cptr,graph->queue);CHKERRQ(ierr);
1084   if (graph->mirrors) {
1085     ierr = PetscFree(graph->mirrors_set[0]);CHKERRQ(ierr);
1086   }
1087   ierr = PetscFree2(graph->mirrors,graph->mirrors_set);CHKERRQ(ierr);
1088   if (graph->subset_idxs) {
1089     ierr = PetscFree(graph->subset_idxs[0]);CHKERRQ(ierr);
1090   }
1091   ierr = PetscFree2(graph->subset_size,graph->subset_idxs);CHKERRQ(ierr);
1092   ierr = ISDestroy(&graph->dirdofs);CHKERRQ(ierr);
1093   ierr = ISDestroy(&graph->dirdofsB);CHKERRQ(ierr);
1094   if (graph->n_local_subs) {
1095     ierr = PetscFree(graph->local_subs);CHKERRQ(ierr);
1096   }
1097   graph->has_dirichlet       = PETSC_FALSE;
1098   graph->twodimset           = PETSC_FALSE;
1099   graph->twodim              = PETSC_FALSE;
1100   graph->nvtxs               = 0;
1101   graph->nvtxs_global        = 0;
1102   graph->n_subsets           = 0;
1103   graph->custom_minimal_size = 1;
1104   graph->n_local_subs        = 0;
1105   graph->maxcount            = PETSC_MAX_INT;
1106   graph->setupcalled         = PETSC_FALSE;
1107   PetscFunctionReturn(0);
1108 }
1109 
1110 #undef __FUNCT__
1111 #define __FUNCT__ "PCBDDCGraphInit"
1112 PetscErrorCode PCBDDCGraphInit(PCBDDCGraph graph, ISLocalToGlobalMapping l2gmap, PetscInt N, PetscInt maxcount)
1113 {
1114   PetscInt       n;
1115   PetscErrorCode ierr;
1116 
1117   PetscFunctionBegin;
1118   PetscValidPointer(graph,1);
1119   PetscValidHeaderSpecific(l2gmap,IS_LTOGM_CLASSID,2);
1120   PetscValidLogicalCollectiveInt(l2gmap,N,3);
1121   PetscValidLogicalCollectiveInt(l2gmap,maxcount,4);
1122   /* raise an error if already allocated */
1123   if (graph->nvtxs_global) SETERRQ(PetscObjectComm((PetscObject)l2gmap),PETSC_ERR_PLIB,"BDDCGraph already initialized");
1124   /* set number of vertices */
1125   ierr = PetscObjectReference((PetscObject)l2gmap);CHKERRQ(ierr);
1126   graph->l2gmap = l2gmap;
1127   ierr = ISLocalToGlobalMappingGetSize(l2gmap,&n);CHKERRQ(ierr);
1128   graph->nvtxs = n;
1129   graph->nvtxs_global = N;
1130   /* allocate used space */
1131   ierr = PetscBTCreate(graph->nvtxs,&graph->touched);CHKERRQ(ierr);
1132   ierr = PetscMalloc5(graph->nvtxs,&graph->count,
1133                       graph->nvtxs,&graph->neighbours_set,
1134                       graph->nvtxs,&graph->subset,
1135                       graph->nvtxs,&graph->which_dof,
1136                       graph->nvtxs,&graph->special_dof);CHKERRQ(ierr);
1137   /* zeroes memory */
1138   ierr = PetscMemzero(graph->count,graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
1139   ierr = PetscMemzero(graph->subset,graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
1140   /* use -1 as a default value for which_dof array */
1141   for (n=0;n<graph->nvtxs;n++) graph->which_dof[n] = -1;
1142   ierr = PetscMemzero(graph->special_dof,graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
1143   /* zeroes first pointer to neighbour set */
1144   if (graph->nvtxs) {
1145     graph->neighbours_set[0] = 0;
1146   }
1147   /* zeroes workspace for values of ncc */
1148   graph->subset_ncc = 0;
1149   graph->subset_ref_node = 0;
1150   /* maxcount for cc */
1151   graph->maxcount = maxcount;
1152   PetscFunctionReturn(0);
1153 }
1154 
1155 #undef __FUNCT__
1156 #define __FUNCT__ "PCBDDCGraphDestroy"
1157 PetscErrorCode PCBDDCGraphDestroy(PCBDDCGraph* graph)
1158 {
1159   PetscErrorCode ierr;
1160 
1161   PetscFunctionBegin;
1162   ierr = PCBDDCGraphResetCSR(*graph);CHKERRQ(ierr);
1163   ierr = PCBDDCGraphReset(*graph);CHKERRQ(ierr);
1164   ierr = PetscFree(*graph);CHKERRQ(ierr);
1165   PetscFunctionReturn(0);
1166 }
1167 
1168 #undef __FUNCT__
1169 #define __FUNCT__ "PCBDDCGraphCreate"
1170 PetscErrorCode PCBDDCGraphCreate(PCBDDCGraph *graph)
1171 {
1172   PCBDDCGraph    new_graph;
1173   PetscErrorCode ierr;
1174 
1175   PetscFunctionBegin;
1176   ierr = PetscNew(&new_graph);CHKERRQ(ierr);
1177   new_graph->custom_minimal_size = 1;
1178   new_graph->commsizelimit = 1;
1179   *graph = new_graph;
1180   PetscFunctionReturn(0);
1181 }
1182