static char help[] = "Test CPU/GPU memory leaks, MatMult and MatMultTransposeAdd during successive matrix assemblies\n\n"; #include int main(int argc, char **argv) { PetscMPIInt rank, size; Mat A; PetscInt i, j, k, n = 3, vstart, rstart, rend, margin; Vec x, y; PetscFunctionBeginUser; PetscCall(PetscInitialize(&argc, &argv, NULL, help)); PetscCallMPI(MPI_Comm_rank(PETSC_COMM_WORLD, &rank)); PetscCallMPI(MPI_Comm_size(PETSC_COMM_WORLD, &size)); PetscCall(MatCreate(PETSC_COMM_WORLD, &A)); PetscCall(MatSetSizes(A, n, n, PETSC_DECIDE, PETSC_DECIDE)); PetscCall(MatSetFromOptions(A)); PetscCall(MatMPIAIJSetPreallocation(A, n, NULL, 0, NULL)); PetscCall(MatSetOption(A, MAT_NEW_NONZERO_ALLOCATION_ERR, PETSC_FALSE)); PetscCall(MatGetOwnershipRange(A, &rstart, &rend)); PetscCall(MatCreateVecs(A, &x, &y)); PetscCall(VecSet(x, 1.0)); /* Matrix A only has nonzeros in the diagonal block, which is of size 3x3. We do three successive assemblies on A. The first two have the same non-zero pattern but different values, and the third breaks the non-zero pattern. The first two assemblies have enough zero-rows that triggers compressed-row storage in MATAIJ and MATAIJCUSPARSE. These settings are used to test memory management and correctness in MatMult and MatMultTransposeAdd. */ for (k = 0; k < 3; k++) { /* Three assemblies */ vstart = (size * k + rank) * n * n + 1; margin = (k == 2) ? 0 : 2; /* Create two zero-rows in the first two assemblies */ for (i = rstart; i < rend - margin; i++) { for (j = rstart; j < rend; j++) { PetscCall(MatSetValue(A, i, j, (PetscScalar)vstart, INSERT_VALUES)); vstart++; } } PetscCall(MatAssemblyBegin(A, MAT_FINAL_ASSEMBLY)); PetscCall(MatAssemblyEnd(A, MAT_FINAL_ASSEMBLY)); PetscCall(MatMult(A, x, y)); PetscCall(MatMultTransposeAdd(A, x, y, y)); /* y[i] = sum of row i and column i of A */ PetscCall(VecView(y, PETSC_VIEWER_STDOUT_WORLD)); } PetscCall(MatDestroy(&A)); PetscCall(VecDestroy(&x)); PetscCall(VecDestroy(&y)); PetscCall(PetscFinalize()); /* Uncomment this line if you want to use "compute-sanitizer --tool memcheck [sanitizer_options] app_name [app_options]" to check this program */ /*cudaDeviceReset();*/ return 0; } /*TEST testset: nsize: 2 output_file: output/ex236_1.out filter: grep -v type test: args: -mat_type aij test: requires: cuda suffix: cuda args: -mat_type aijcusparse TEST*/