xref: /petsc/src/vec/is/sf/tutorials/ex2.c (revision 65c78980d86b286952aba5ac84149d487245284f)
/* Description string for this example; main() passes it to PetscInitialize() as its last argument. */
1 static const char help[] = "Test overlapped communication on a single star forest (PetscSF)\n\n";
2 
3 #include <petscvec.h>
4 #include <petscsf.h>
5 #include <petscviewer.h>
6 
7 int main(int argc, char **argv)
8 {
9   PetscSF     sf;
10   Vec         A,Aout;
11   Vec         B,Bout;
12   PetscScalar *bufA;
13   PetscScalar *bufAout;
14   PetscScalar *bufB;
15   PetscScalar *bufBout;
16   PetscMPIInt rank, size;
17   PetscInt    nroots, nleaves;
18   PetscInt    i;
19   PetscInt    *ilocal;
20   PetscSFNode *iremote;
21 
22   PetscFunctionBeginUser;
23   PetscCall(PetscInitialize(&argc,&argv,NULL,help));
24   PetscCallMPI(MPI_Comm_rank(PETSC_COMM_WORLD,&rank));
25   PetscCallMPI(MPI_Comm_size(PETSC_COMM_WORLD,&size));
26 
27   PetscCheck(size == 2,PETSC_COMM_WORLD, PETSC_ERR_USER, "Only coded for two MPI processes");
28 
29   PetscCall(PetscSFCreate(PETSC_COMM_WORLD,&sf));
30   PetscCall(PetscSFSetFromOptions(sf));
31 
32   nleaves = 2;
33   nroots = 1;
34   PetscCall(PetscMalloc1(nleaves,&ilocal));
35 
36   for (i = 0; i<nleaves; i++) {
37     ilocal[i] = i;
38   }
39 
40   PetscCall(PetscMalloc1(nleaves,&iremote));
41   if (rank == 0) {
42     iremote[0].rank = 0;
43     iremote[0].index = 0;
44     iremote[1].rank = 1;
45     iremote[1].index = 0;
46   } else {
47     iremote[0].rank = 1;
48     iremote[0].index = 0;
49     iremote[1].rank = 0;
50     iremote[1].index = 0;
51   }
52   PetscCall(PetscSFSetGraph(sf,nroots,nleaves,ilocal,PETSC_OWN_POINTER,iremote,PETSC_OWN_POINTER));
53   PetscCall(PetscSFSetUp(sf));
54   PetscCall(PetscSFView(sf,PETSC_VIEWER_STDOUT_WORLD));
55   PetscCall(VecCreate(PETSC_COMM_WORLD,&A));
56   PetscCall(VecSetSizes(A,2,PETSC_DETERMINE));
57   PetscCall(VecSetFromOptions(A));
58   PetscCall(VecSetUp(A));
59 
60   PetscCall(VecDuplicate(A,&B));
61   PetscCall(VecDuplicate(A,&Aout));
62   PetscCall(VecDuplicate(A,&Bout));
63   PetscCall(VecGetArray(A,&bufA));
64   PetscCall(VecGetArray(B,&bufB));
65   for (i=0; i<2; i++) {
66     bufA[i] = (PetscScalar)rank;
67     bufB[i] = (PetscScalar)(rank) + 10.0;
68   }
69   PetscCall(VecRestoreArray(A,&bufA));
70   PetscCall(VecRestoreArray(B,&bufB));
71 
72   PetscCall(VecGetArrayRead(A,(const PetscScalar**)&bufA));
73   PetscCall(VecGetArrayRead(B,(const PetscScalar**)&bufB));
74   PetscCall(VecGetArray(Aout,&bufAout));
75   PetscCall(VecGetArray(Bout,&bufBout));
76   PetscCall(PetscSFBcastBegin(sf,MPIU_SCALAR,(const void*)bufA,(void *)bufAout,MPI_REPLACE));
77   PetscCall(PetscSFBcastBegin(sf,MPIU_SCALAR,(const void*)bufB,(void *)bufBout,MPI_REPLACE));
78   PetscCall(PetscSFBcastEnd(sf,MPIU_SCALAR,(const void*)bufA,(void *)bufAout,MPI_REPLACE));
79   PetscCall(PetscSFBcastEnd(sf,MPIU_SCALAR,(const void*)bufB,(void *)bufBout,MPI_REPLACE));
80   PetscCall(VecRestoreArrayRead(A,(const PetscScalar**)&bufA));
81   PetscCall(VecRestoreArrayRead(B,(const PetscScalar**)&bufB));
82   PetscCall(VecRestoreArray(Aout,&bufAout));
83   PetscCall(VecRestoreArray(Bout,&bufBout));
84 
85   PetscCall(VecView(Aout,PETSC_VIEWER_STDOUT_WORLD));
86   PetscCall(VecView(Bout,PETSC_VIEWER_STDOUT_WORLD));
87   PetscCall(VecDestroy(&A));
88   PetscCall(VecDestroy(&B));
89   PetscCall(VecDestroy(&Aout));
90   PetscCall(VecDestroy(&Bout));
91   PetscCall(PetscSFDestroy(&sf));
92 
93   PetscCall(PetscFinalize());
94   return 0;
95 }
96 
97 /*TEST
98 
99    test:
100       suffix: basic
101       nsize: 2
102       filter: grep -v "type" | grep -v "sort"
103       args: -sf_type basic
104 
105    test:
106       suffix: window
107       nsize: 2
108       filter: grep -v "type" | grep -v "sort"
109       output_file: output/ex2_basic.out
110       args: -sf_type window -sf_window_sync {{fence active lock}} -sf_window_flavor {{create dynamic allocate}}
111       requires: defined(PETSC_HAVE_MPI_ONE_SIDED) defined(PETSC_HAVE_MPI_FEATURE_DYNAMIC_WINDOW)
112 
113    # The nightly test suite with MPICH uses ch3:sock, which is broken when winsize == 0 in some of the processes
114    test:
115       suffix: window_shared
116       nsize: 2
117       filter: grep -v "type" | grep -v "sort"
118       output_file: output/ex2_basic.out
119       args: -sf_type window -sf_window_sync {{fence active lock}} -sf_window_flavor shared
120       requires: defined(PETSC_HAVE_MPI_PROCESS_SHARED_MEMORY) !defined(PETSC_HAVE_MPICH_NUMVERSION) defined(PETSC_HAVE_MPI_ONE_SIDED)
121 
122 TEST*/
123