xref: /petsc/src/mat/tests/ex236.c (revision 8fb5bd83c3955fefcf33a54e3bb66920a9fa884b)
/* Help text handed to PetscInitialize(); PETSc prints it when the program is run with -help. */
static char help[] =
  "Test CPU/GPU memory leaks, MatMult and MatMultTransposeAdd "
  "during successive matrix assemblies\n\n";
2 
3 #include <petscmat.h>
4 
5 int main(int argc,char **argv)
6 {
7   PetscMPIInt rank,size;
8   Mat         A;
9   PetscInt    i,j,k,n = 3,vstart,rstart,rend,margin;
10   Vec         x,y;
11 
12   PetscCall(PetscInitialize(&argc,&argv,(char*)0,help));
13   PetscCallMPI(MPI_Comm_rank(PETSC_COMM_WORLD,&rank));
14   PetscCallMPI(MPI_Comm_size(PETSC_COMM_WORLD,&size));
15 
16   PetscCall(MatCreate(PETSC_COMM_WORLD,&A));
17   PetscCall(MatSetSizes(A,n,n,PETSC_DECIDE,PETSC_DECIDE));
18   PetscCall(MatSetFromOptions(A));
19 
20   PetscCall(MatMPIAIJSetPreallocation(A,n,NULL,0,NULL));
21   PetscCall(MatSetOption(A,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_FALSE));
22   PetscCall(MatGetOwnershipRange(A,&rstart,&rend));
23   PetscCall(MatCreateVecs(A,&x,&y));
24   PetscCall(VecSet(x,1.0));
25 
26   /*
27     Matrix A only has nonzeros in the diagonal block, which is of size 3x3.
28     We do three successive assemblies on A. The first two have the same non-zero
29     pattern but different values, and the third breaks the non-zero pattern. The
30     first two assemblies have enough zero-rows that triggers compressed-row storage
31     in MATAIJ and MATAIJCUSPARSE.
32 
33     These settings are used to test memory management and correctness in MatMult
34     and MatMultTransposeAdd.
35   */
36 
37   for (k=0; k<3; k++) { /* Three assemblies */
38     vstart = (size*k + rank)*n*n+1;
39     margin = (k == 2)? 0 : 2; /* Create two zero-rows in the first two assemblies */
40     for (i=rstart; i<rend-margin; i++) {
41       for (j=rstart; j<rend; j++) {
42         PetscCall(MatSetValue(A,i,j,(PetscScalar)vstart,INSERT_VALUES));
43         vstart++;
44       }
45     }
46     PetscCall(MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY));
47     PetscCall(MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY));
48     PetscCall(MatMult(A,x,y));
49     PetscCall(MatMultTransposeAdd(A,x,y,y)); /* y[i] = sum of row i and column i of A */
50     PetscCall(VecView(y,PETSC_VIEWER_STDOUT_WORLD));
51   }
52 
53   PetscCall(MatDestroy(&A));
54   PetscCall(VecDestroy(&x));
55   PetscCall(VecDestroy(&y));
56   PetscCall(PetscFinalize());
57 
58   /* Uncomment this line if you want to use "cuda-memcheck --leaf-check full" to check this program */
59   /*cudaDeviceReset();*/
60   return 0;
61 }
62 
63 /*TEST
64 
65    testset:
66      nsize: 2
67      output_file: output/ex236_1.out
68      filter: grep -v type
69 
70      test:
71        args: -mat_type aij
72 
73      test:
74        requires: cuda
75        suffix: cuda
76        args: -mat_type aijcusparse
77 TEST*/
78