1c4762a1bSJed Brown static const char help[] = "Test overlapped communication on a single star forest (PetscSF)\n\n"; 2c4762a1bSJed Brown 3c4762a1bSJed Brown #include <petscvec.h> 4c4762a1bSJed Brown #include <petscsf.h> 5c4762a1bSJed Brown #include <petscviewer.h> 6c4762a1bSJed Brown 7c4762a1bSJed Brown int main(int argc, char **argv) 8c4762a1bSJed Brown { 9c4762a1bSJed Brown PetscSF sf; 10c4762a1bSJed Brown Vec A,Aout; 11c4762a1bSJed Brown Vec B,Bout; 12c4762a1bSJed Brown PetscScalar *bufA; 13c4762a1bSJed Brown PetscScalar *bufAout; 14c4762a1bSJed Brown PetscScalar *bufB; 15c4762a1bSJed Brown PetscScalar *bufBout; 16c4762a1bSJed Brown PetscMPIInt rank, size; 17c4762a1bSJed Brown PetscInt nroots, nleaves; 18c4762a1bSJed Brown PetscInt i; 19c4762a1bSJed Brown PetscInt *ilocal; 20c4762a1bSJed Brown PetscSFNode *iremote; 21c4762a1bSJed Brown 22*b122ec5aSJacob Faibussowitsch CHKERRQ(PetscInitialize(&argc,&argv,NULL,help)); 235f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_rank(PETSC_COMM_WORLD,&rank)); 245f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_size(PETSC_COMM_WORLD,&size)); 25c4762a1bSJed Brown 262c71b3e2SJacob Faibussowitsch PetscCheckFalse(size != 2,PETSC_COMM_WORLD, PETSC_ERR_USER, "Only coded for two MPI processes"); 27c4762a1bSJed Brown 285f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFCreate(PETSC_COMM_WORLD,&sf)); 295f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetFromOptions(sf)); 30c4762a1bSJed Brown 31c4762a1bSJed Brown nleaves = 2; 32c4762a1bSJed Brown nroots = 1; 335f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(nleaves,&ilocal)); 34c4762a1bSJed Brown 35c4762a1bSJed Brown for (i = 0; i<nleaves; i++) { 36c4762a1bSJed Brown ilocal[i] = i; 37c4762a1bSJed Brown } 38c4762a1bSJed Brown 395f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(nleaves,&iremote)); 40c4762a1bSJed Brown if (rank == 0) { 41c4762a1bSJed Brown iremote[0].rank = 0; 42c4762a1bSJed Brown iremote[0].index = 0; 43c4762a1bSJed Brown iremote[1].rank = 1; 44c4762a1bSJed Brown iremote[1].index = 0; 45c4762a1bSJed Brown } else { 46c4762a1bSJed Brown iremote[0].rank = 1; 47c4762a1bSJed Brown iremote[0].index = 0; 48c4762a1bSJed Brown iremote[1].rank = 0; 49c4762a1bSJed Brown iremote[1].index = 0; 50c4762a1bSJed Brown } 515f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetGraph(sf,nroots,nleaves,ilocal,PETSC_OWN_POINTER,iremote,PETSC_OWN_POINTER)); 525f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetUp(sf)); 535f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFView(sf,PETSC_VIEWER_STDOUT_WORLD)); 545f80ce2aSJacob Faibussowitsch CHKERRQ(VecCreate(PETSC_COMM_WORLD,&A)); 555f80ce2aSJacob Faibussowitsch CHKERRQ(VecSetSizes(A,2,PETSC_DETERMINE)); 565f80ce2aSJacob Faibussowitsch CHKERRQ(VecSetFromOptions(A)); 575f80ce2aSJacob Faibussowitsch CHKERRQ(VecSetUp(A)); 58c4762a1bSJed Brown 595f80ce2aSJacob Faibussowitsch CHKERRQ(VecDuplicate(A,&B)); 605f80ce2aSJacob Faibussowitsch CHKERRQ(VecDuplicate(A,&Aout)); 615f80ce2aSJacob Faibussowitsch CHKERRQ(VecDuplicate(A,&Bout)); 625f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(A,&bufA)); 635f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(B,&bufB)); 64c4762a1bSJed Brown for (i=0; i<2; i++) { 65c4762a1bSJed Brown bufA[i] = (PetscScalar)rank; 66c4762a1bSJed Brown bufB[i] = (PetscScalar)(rank) + 10.0; 67c4762a1bSJed Brown } 685f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(A,&bufA)); 695f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(B,&bufB)); 70c4762a1bSJed Brown 715f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArrayRead(A,(const PetscScalar**)&bufA)); 725f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArrayRead(B,(const PetscScalar**)&bufB)); 735f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(Aout,&bufAout)); 745f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(Bout,&bufBout)); 755f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastBegin(sf,MPIU_SCALAR,(const void*)bufA,(void *)bufAout,MPI_REPLACE)); 765f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastBegin(sf,MPIU_SCALAR,(const void*)bufB,(void *)bufBout,MPI_REPLACE)); 775f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastEnd(sf,MPIU_SCALAR,(const void*)bufA,(void *)bufAout,MPI_REPLACE)); 785f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastEnd(sf,MPIU_SCALAR,(const void*)bufB,(void *)bufBout,MPI_REPLACE)); 795f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArrayRead(A,(const PetscScalar**)&bufA)); 805f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArrayRead(B,(const PetscScalar**)&bufB)); 815f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(Aout,&bufAout)); 825f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(Bout,&bufBout)); 83c4762a1bSJed Brown 845f80ce2aSJacob Faibussowitsch CHKERRQ(VecView(Aout,PETSC_VIEWER_STDOUT_WORLD)); 855f80ce2aSJacob Faibussowitsch CHKERRQ(VecView(Bout,PETSC_VIEWER_STDOUT_WORLD)); 865f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&A)); 875f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&B)); 885f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&Aout)); 895f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&Bout)); 905f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFDestroy(&sf)); 91c4762a1bSJed Brown 92*b122ec5aSJacob Faibussowitsch CHKERRQ(PetscFinalize()); 93*b122ec5aSJacob Faibussowitsch return 0; 94c4762a1bSJed Brown } 95c4762a1bSJed Brown 96c4762a1bSJed Brown /*TEST 97c4762a1bSJed Brown 98c4762a1bSJed Brown test: 99c4762a1bSJed Brown suffix: basic 100c4762a1bSJed Brown nsize: 2 101c4762a1bSJed Brown filter: grep -v "type" | grep -v "sort" 102c4762a1bSJed Brown args: -sf_type basic 103c4762a1bSJed Brown 104c4762a1bSJed Brown test: 105c4762a1bSJed Brown suffix: window 106c4762a1bSJed Brown nsize: 2 107c4762a1bSJed Brown filter: grep -v "type" | grep -v "sort" 108c4762a1bSJed Brown output_file: output/ex2_basic.out 109c4762a1bSJed Brown args: -sf_type window -sf_window_sync {{fence active lock}} -sf_window_flavor {{create dynamic allocate}} 110dfd57a17SPierre Jolivet requires: defined(PETSC_HAVE_MPI_ONE_SIDED) defined(PETSC_HAVE_MPI_FEATURE_DYNAMIC_WINDOW) 111c4762a1bSJed Brown 112c4762a1bSJed Brown # The nightly test suite with MPICH uses ch3:sock, which is broken when winsize == 0 in some of the processes 113c4762a1bSJed Brown test: 114c4762a1bSJed Brown suffix: window_shared 115c4762a1bSJed Brown nsize: 2 116c4762a1bSJed Brown filter: grep -v "type" | grep -v "sort" 117c4762a1bSJed Brown output_file: output/ex2_basic.out 118c4762a1bSJed Brown args: -sf_type window -sf_window_sync {{fence active lock}} -sf_window_flavor shared 119dfd57a17SPierre Jolivet requires: defined(PETSC_HAVE_MPI_PROCESS_SHARED_MEMORY) !defined(PETSC_HAVE_MPICH_NUMVERSION) defined(PETSC_HAVE_MPI_ONE_SIDED) 120c4762a1bSJed Brown 121c4762a1bSJed Brown TEST*/ 122