1936c5a86SJed Brown /* 2936c5a86SJed Brown A star forest (SF) describes a communication pattern 3936c5a86SJed Brown */ 426bd1501SBarry Smith #if !defined(PETSCSF_H) 526bd1501SBarry Smith #define PETSCSF_H 62c8e378dSBarry Smith #include <petscsys.h> 7dd5b3ca6SJunchao Zhang #include <petscis.h> 80c312b8eSJed Brown #include <petscsftypes.h> 9936c5a86SJed Brown 10014dd563SJed Brown PETSC_EXTERN PetscClassId PETSCSF_CLASSID; 11936c5a86SJed Brown 125af141bcSJed Brown /*J 13dd5b3ca6SJunchao Zhang PetscSFType - String with the name of a PetscSF type 145af141bcSJed Brown 155af141bcSJed Brown Level: beginner 165af141bcSJed Brown 175af141bcSJed Brown .seealso: PetscSFSetType(), PetscSF 185af141bcSJed Brown J*/ 195af141bcSJed Brown typedef const char *PetscSFType; 20ac762476SJed Brown #define PETSCSFBASIC "basic" 21027eff8aSJunchao Zhang #define PETSCSFNEIGHBOR "neighbor" 22dd5b3ca6SJunchao Zhang #define PETSCSFALLGATHERV "allgatherv" 23dd5b3ca6SJunchao Zhang #define PETSCSFALLGATHER "allgather" 24dd5b3ca6SJunchao Zhang #define PETSCSFGATHERV "gatherv" 25dd5b3ca6SJunchao Zhang #define PETSCSFGATHER "gather" 26dd5b3ca6SJunchao Zhang #define PETSCSFALLTOALL "alltoall" 27ed658588SBarry Smith #define PETSCSFWINDOW "window" 285af141bcSJed Brown 29936c5a86SJed Brown /*E 30dd5b3ca6SJunchao Zhang PetscSFPattern - Pattern of the PetscSF graph 31dd5b3ca6SJunchao Zhang 32dd5b3ca6SJunchao Zhang $ PETSCSF_PATTERN_GENERAL - A general graph. One sets the graph with PetscSFSetGraph() and usually does not use this enum directly. 33dd5b3ca6SJunchao Zhang $ PETSCSF_PATTERN_ALLGATHER - A graph that every rank gathers all roots from all ranks (like MPI_Allgather/v). One sets the graph with PetscSFSetGraphWithPattern(). 34dd5b3ca6SJunchao Zhang $ PETSCSF_PATTERN_GATHER - A graph that rank 0 gathers all roots from all ranks (like MPI_Gather/v with root=0). One sets the graph with PetscSFSetGraphWithPattern(). 35dd5b3ca6SJunchao Zhang $ PETSCSF_PATTERN_ALLTOALL - A graph that every rank gathers different roots from all ranks (like MPI_Alltoall). One sets the graph with PetscSFSetGraphWithPattern(). 36dd5b3ca6SJunchao Zhang In an ALLTOALL graph, we assume each process has <size> leaves and <size> roots, with each leaf connecting to a remote root. Here <size> is 37dd5b3ca6SJunchao Zhang the size of the communicator. This does not mean one can not communicate multiple data items between a pair of processes. One just needs to 38dd5b3ca6SJunchao Zhang create a new MPI datatype for the multiple data items, e.g., by MPI_Type_contiguous. 39dd5b3ca6SJunchao Zhang Level: beginner 40dd5b3ca6SJunchao Zhang 41dd5b3ca6SJunchao Zhang .seealso: PetscSFSetGraph(), PetscSFSetGraphWithPattern() 42dd5b3ca6SJunchao Zhang E*/ 43dd5b3ca6SJunchao Zhang typedef enum {PETSCSF_PATTERN_GENERAL=0,PETSCSF_PATTERN_ALLGATHER,PETSCSF_PATTERN_GATHER,PETSCSF_PATTERN_ALLTOALL} PetscSFPattern; 44dd5b3ca6SJunchao Zhang 45dd5b3ca6SJunchao Zhang /*E 465af141bcSJed Brown PetscSFWindowSyncType - Type of synchronization for PETSCSFWINDOW 47936c5a86SJed Brown 485af141bcSJed Brown $ PETSCSF_WINDOW_SYNC_FENCE - simplest model, synchronizing across communicator 495af141bcSJed Brown $ PETSCSF_WINDOW_SYNC_LOCK - passive model, less synchronous, requires less setup than PETSCSF_WINDOW_SYNC_ACTIVE, but may require more handshakes 505af141bcSJed Brown $ PETSCSF_WINDOW_SYNC_ACTIVE - active model, provides most information to MPI implementation, needs to construct 2-way process groups (more setup than PETSCSF_WINDOW_SYNC_LOCK) 51936c5a86SJed Brown 52e84a5f06SJed Brown Level: advanced 53936c5a86SJed Brown 54e84a5f06SJed Brown .seealso: PetscSFWindowSetSyncType(), PetscSFWindowGetSyncType() 55936c5a86SJed Brown E*/ 565af141bcSJed Brown typedef enum {PETSCSF_WINDOW_SYNC_FENCE,PETSCSF_WINDOW_SYNC_LOCK,PETSCSF_WINDOW_SYNC_ACTIVE} PetscSFWindowSyncType; 575af141bcSJed Brown PETSC_EXTERN const char *const PetscSFWindowSyncTypes[]; 58936c5a86SJed Brown 59e84a5f06SJed Brown /*E 605b0d146aSStefano Zampini PetscSFWindowFlavorType - Flavor for the creation of MPI windows for PETSCSFWINDOW 615b0d146aSStefano Zampini 625b0d146aSStefano Zampini $ PETSCSF_WINDOW_FLAVOR_CREATE - Use MPI_Win_create, no reusage 635b0d146aSStefano Zampini $ PETSCSF_WINDOW_FLAVOR_DYNAMIC - Use MPI_Win_create_dynamic and dynamically attach pointers 645b0d146aSStefano Zampini $ PETSCSF_WINDOW_FLAVOR_ALLOCATE - Use MPI_Win_allocate 655b0d146aSStefano Zampini $ PETSCSF_WINDOW_FLAVOR_SHARED - Use MPI_Win_allocate_shared 665b0d146aSStefano Zampini 675b0d146aSStefano Zampini Level: advanced 685b0d146aSStefano Zampini 695b0d146aSStefano Zampini .seealso: PetscSFWindowSetFlavorType(), PetscSFWindowGetFlavorType() 705b0d146aSStefano Zampini E*/ 715b0d146aSStefano Zampini typedef enum {PETSCSF_WINDOW_FLAVOR_CREATE,PETSCSF_WINDOW_FLAVOR_DYNAMIC,PETSCSF_WINDOW_FLAVOR_ALLOCATE,PETSCSF_WINDOW_FLAVOR_SHARED} PetscSFWindowFlavorType; 725b0d146aSStefano Zampini PETSC_EXTERN const char *const PetscSFWindowFlavorTypes[]; 735b0d146aSStefano Zampini 745b0d146aSStefano Zampini /*E 75e84a5f06SJed Brown PetscSFDuplicateOption - Aspects to preserve when duplicating a PetscSF 76e84a5f06SJed Brown 77e84a5f06SJed Brown $ PETSCSF_DUPLICATE_CONFONLY - configuration only, user must call PetscSFSetGraph() 78e84a5f06SJed Brown $ PETSCSF_DUPLICATE_RANKS - communication ranks preserved, but different graph (allows simpler setup after calling PetscSFSetGraph()) 79e84a5f06SJed Brown $ PETSCSF_DUPLICATE_GRAPH - entire graph duplicated 80e84a5f06SJed Brown 81e84a5f06SJed Brown Level: beginner 82e84a5f06SJed Brown 83e84a5f06SJed Brown .seealso: PetscSFDuplicate() 84e84a5f06SJed Brown E*/ 85e84a5f06SJed Brown typedef enum {PETSCSF_DUPLICATE_CONFONLY,PETSCSF_DUPLICATE_RANKS,PETSCSF_DUPLICATE_GRAPH} PetscSFDuplicateOption; 86e84a5f06SJed Brown PETSC_EXTERN const char *const PetscSFDuplicateOptions[]; 87090c6444SJed Brown 88adc40e5bSBarry Smith PETSC_EXTERN PetscFunctionList PetscSFList; 89bdf89e91SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFRegister(const char[],PetscErrorCode (*)(PetscSF)); 905af141bcSJed Brown 91607a6623SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFInitializePackage(void); 92014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFFinalizePackage(void); 9379c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFCreate(MPI_Comm,PetscSF*); 94014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFDestroy(PetscSF*); 955af141bcSJed Brown PETSC_EXTERN PetscErrorCode PetscSFSetType(PetscSF,PetscSFType); 9629046d53SLisandro Dalcin PETSC_EXTERN PetscErrorCode PetscSFGetType(PetscSF,PetscSFType*); 97014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFView(PetscSF,PetscViewer); 98fe2efc57SMark PETSC_EXTERN PetscErrorCode PetscSFViewFromOptions(PetscSF,PetscObject,const char[]); 995af141bcSJed Brown PETSC_EXTERN PetscErrorCode PetscSFSetUp(PetscSF); 100014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFSetFromOptions(PetscSF); 101e84a5f06SJed Brown PETSC_EXTERN PetscErrorCode PetscSFDuplicate(PetscSF,PetscSFDuplicateOption,PetscSF*); 1025af141bcSJed Brown PETSC_EXTERN PetscErrorCode PetscSFWindowSetSyncType(PetscSF,PetscSFWindowSyncType); 1035af141bcSJed Brown PETSC_EXTERN PetscErrorCode PetscSFWindowGetSyncType(PetscSF,PetscSFWindowSyncType*); 1045b0d146aSStefano Zampini PETSC_EXTERN PetscErrorCode PetscSFWindowSetFlavorType(PetscSF,PetscSFWindowFlavorType); 1055b0d146aSStefano Zampini PETSC_EXTERN PetscErrorCode PetscSFWindowGetFlavorType(PetscSF,PetscSFWindowFlavorType*); 1062eb0eadbSSatish Balay PETSC_EXTERN PetscErrorCode PetscSFWindowSetInfo(PetscSF,MPI_Info); 1072eb0eadbSSatish Balay PETSC_EXTERN PetscErrorCode PetscSFWindowGetInfo(PetscSF,MPI_Info*); 108014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFSetRankOrder(PetscSF,PetscBool); 10963f4a732SJed Brown PETSC_EXTERN PetscErrorCode PetscSFSetGraph(PetscSF,PetscInt,PetscInt,const PetscInt*,PetscCopyMode,const PetscSFNode*,PetscCopyMode); 110dd5b3ca6SJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFSetGraphWithPattern(PetscSF,PetscLayout,PetscSFPattern); 11179c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFGetGraph(PetscSF,PetscInt*,PetscInt*,const PetscInt**,const PetscSFNode**); 112f723732fSJed Brown PETSC_EXTERN PetscErrorCode PetscSFGetLeafRange(PetscSF,PetscInt*,PetscInt*); 11379c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFCreateEmbeddedSF(PetscSF,PetscInt,const PetscInt*,PetscSF*); 1142f5fb4c2SMatthew G. Knepley PETSC_EXTERN PetscErrorCode PetscSFCreateEmbeddedLeafSF(PetscSF,PetscInt,const PetscInt *, PetscSF *); 115014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFReset(PetscSF); 116b5a8e515SJed Brown PETSC_EXTERN PetscErrorCode PetscSFSetUpRanks(PetscSF,MPI_Group); 117dec1416fSJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFGetRootRanks(PetscSF,PetscInt*,const PetscMPIInt**,const PetscInt**,const PetscInt**,const PetscInt**); 1188750ddebSJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFGetLeafRanks(PetscSF,PetscInt*,const PetscMPIInt**,const PetscInt**,const PetscInt**); 119014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFGetGroups(PetscSF,MPI_Group*,MPI_Group*); 120014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFGetMultiSF(PetscSF,PetscSF*); 121014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFCreateInverseSF(PetscSF,PetscSF*); 122936c5a86SJed Brown 1233482bfa8SJunchao Zhang /* Reduce rootdata to leafdata using provided operation */ 1243482bfa8SJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFBcastAndOpBegin(PetscSF,MPI_Datatype,const void*,void*,MPI_Op) 1253482bfa8SJunchao Zhang PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 1263482bfa8SJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFBcastAndOpEnd(PetscSF,MPI_Datatype,const void*,void*,MPI_Op) 1273482bfa8SJunchao Zhang PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 128*d0295fc0SJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFBcastAndOpWithMemTypeBegin(PetscSF,MPI_Datatype,PetscMemType,const void*,PetscMemType,void*,MPI_Op) 129*d0295fc0SJunchao Zhang PetscAttrMPIPointerWithType(4,2) PetscAttrMPIPointerWithType(6,2); 130*d0295fc0SJunchao Zhang 131936c5a86SJed Brown /* Reduce leafdata into rootdata using provided operation */ 13279c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFReduceBegin(PetscSF,MPI_Datatype,const void*,void *,MPI_Op) 13319436ca2SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 13479c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFReduceEnd(PetscSF,MPI_Datatype,const void*,void*,MPI_Op) 13519436ca2SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 136*d0295fc0SJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFReduceWithMemTypeBegin(PetscSF,MPI_Datatype,PetscMemType,const void*,PetscMemType,void *,MPI_Op) 137*d0295fc0SJunchao Zhang PetscAttrMPIPointerWithType(4,2) PetscAttrMPIPointerWithType(6,2); 138936c5a86SJed Brown /* Atomically modifies (using provided operation) rootdata using leafdata from each leaf, value at root at time of modification is returned in leafupdate. */ 13979c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFFetchAndOpBegin(PetscSF,MPI_Datatype,void*,const void*,void*,MPI_Op) 140894dd566SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2) PetscAttrMPIPointerWithType(5,2); 14179c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFFetchAndOpEnd(PetscSF,MPI_Datatype,void*,const void*,void*,MPI_Op) 142894dd566SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2) PetscAttrMPIPointerWithType(5,2); 143936c5a86SJed Brown /* Compute the degree of every root vertex (number of leaves in its star) */ 14479c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFComputeDegreeBegin(PetscSF,const PetscInt**); 14579c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFComputeDegreeEnd(PetscSF,const PetscInt**); 14666dfcd1aSVaclav Hapla PETSC_EXTERN PetscErrorCode PetscSFComputeMultiRootOriginalNumbering(PetscSF,const PetscInt[],PetscInt*,PetscInt*[]); 147936c5a86SJed Brown /* Concatenate data from all leaves into roots */ 14879c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFGatherBegin(PetscSF,MPI_Datatype,const void*,void*) 149894dd566SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 15079c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFGatherEnd(PetscSF,MPI_Datatype,const void*,void*) 151894dd566SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 152936c5a86SJed Brown /* Distribute distinct values to each leaf from roots */ 15379c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFScatterBegin(PetscSF,MPI_Datatype,const void*,void*) 154894dd566SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 15579c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFScatterEnd(PetscSF,MPI_Datatype,const void*,void*) 156894dd566SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 157936c5a86SJed Brown 158a7b3aa13SAta Mesgarnejad PETSC_EXTERN PetscErrorCode PetscSFCompose(PetscSF,PetscSF,PetscSF*); 15904c0ada0SJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFComposeInverse(PetscSF,PetscSF,PetscSF*); 160a7b3aa13SAta Mesgarnejad 1618bfbc91cSJed Brown #if defined(MPI_REPLACE) 1628bfbc91cSJed Brown # define MPIU_REPLACE MPI_REPLACE 1638bfbc91cSJed Brown #else 1648bfbc91cSJed Brown /* When using an old MPI such that MPI_REPLACE is not defined, we do not pass MPI_REPLACE to MPI at all. Instead, we 1658bfbc91cSJed Brown * use it as a flag for our own reducer in the PETSCSFBASIC implementation. This could be any unique value unlikely to 1668bfbc91cSJed Brown * collide with another MPI_Op so we'll just use the value that has been used by every version of MPICH since 1678bfbc91cSJed Brown * MPICH2-1.0.6. */ 1688bfbc91cSJed Brown # define MPIU_REPLACE (MPI_Op)(0x5800000d) 1698bfbc91cSJed Brown #endif 1708bfbc91cSJed Brown 171dec1416fSJunchao Zhang PETSC_DEPRECATED_FUNCTION("Use PetscSFGetRootRanks (since v3.12)") 172dec1416fSJunchao Zhang PETSC_STATIC_INLINE PetscErrorCode PetscSFGetRanks(PetscSF sf,PetscInt *nranks,const PetscMPIInt **ranks,const PetscInt **roffset,const PetscInt **rmine,const PetscInt **rremote) { 173dec1416fSJunchao Zhang return PetscSFGetRootRanks(sf,nranks,ranks,roffset,rmine,rremote); 174dec1416fSJunchao Zhang } 175e2652d4cSJunchao Zhang 176c73c85a0SVaclav Hapla /*@C 177c73c85a0SVaclav Hapla PetscSFBcastBegin - begin pointwise broadcast to be concluded with call to PetscSFBcastEnd() 178c73c85a0SVaclav Hapla 179c73c85a0SVaclav Hapla Collective on PetscSF 180c73c85a0SVaclav Hapla 181c73c85a0SVaclav Hapla Input Arguments: 182c73c85a0SVaclav Hapla + sf - star forest on which to communicate 183c73c85a0SVaclav Hapla . unit - data type associated with each node 184c73c85a0SVaclav Hapla - rootdata - buffer to broadcast 185c73c85a0SVaclav Hapla 186c73c85a0SVaclav Hapla Output Arguments: 187c73c85a0SVaclav Hapla . leafdata - buffer to update with values from each leaf's respective root 188c73c85a0SVaclav Hapla 189c73c85a0SVaclav Hapla Level: intermediate 190c73c85a0SVaclav Hapla 1918eeec653SVaclav Hapla .seealso: PetscSFCreate(), PetscSFSetGraph(), PetscSFView(), PetscSFBcastEnd(), PetscSFReduceBegin(), PetscSFBcastAndOpBegin() 192c73c85a0SVaclav Hapla @*/ 193e2652d4cSJunchao Zhang PETSC_STATIC_INLINE PetscErrorCode PetscSFBcastBegin(PetscSF sf,MPI_Datatype unit,const void* rootdata,void* leafdata) { 194e2652d4cSJunchao Zhang return PetscSFBcastAndOpBegin(sf,unit,rootdata,leafdata,MPIU_REPLACE); 195e2652d4cSJunchao Zhang } 196c73c85a0SVaclav Hapla 197*d0295fc0SJunchao Zhang PETSC_STATIC_INLINE PetscErrorCode PetscSFBcastWithMemTypeBegin(PetscSF sf,MPI_Datatype unit,PetscMemType rootmtype,const void* rootdata,PetscMemType leafmtype,void* leafdata) { 198*d0295fc0SJunchao Zhang return PetscSFBcastAndOpWithMemTypeBegin(sf,unit,rootmtype,rootdata,leafmtype,leafdata,MPIU_REPLACE); 199*d0295fc0SJunchao Zhang } 200*d0295fc0SJunchao Zhang 201c73c85a0SVaclav Hapla /*@C 202c73c85a0SVaclav Hapla PetscSFBcastEnd - end a broadcast operation started with PetscSFBcastBegin() 203c73c85a0SVaclav Hapla 204c73c85a0SVaclav Hapla Collective 205c73c85a0SVaclav Hapla 206c73c85a0SVaclav Hapla Input Arguments: 207c73c85a0SVaclav Hapla + sf - star forest 208c73c85a0SVaclav Hapla . unit - data type 209c73c85a0SVaclav Hapla - rootdata - buffer to broadcast 210c73c85a0SVaclav Hapla 211c73c85a0SVaclav Hapla Output Arguments: 212c73c85a0SVaclav Hapla . leafdata - buffer to update with values from each leaf's respective root 213c73c85a0SVaclav Hapla 214c73c85a0SVaclav Hapla Level: intermediate 215c73c85a0SVaclav Hapla 216c73c85a0SVaclav Hapla .seealso: PetscSFSetGraph(), PetscSFReduceEnd() 217c73c85a0SVaclav Hapla @*/ 218e2652d4cSJunchao Zhang PETSC_STATIC_INLINE PetscErrorCode PetscSFBcastEnd(PetscSF sf,MPI_Datatype unit,const void* rootdata,void* leafdata) { 219e2652d4cSJunchao Zhang return PetscSFBcastAndOpEnd(sf,unit,rootdata,leafdata,MPIU_REPLACE); 220e2652d4cSJunchao Zhang } 221e2652d4cSJunchao Zhang 222936c5a86SJed Brown #endif 223