142565d0bSMatthew G. Knepley static char help[] = "Exhaustive memory tracking for DMPlex.\n\n\n"; 242565d0bSMatthew G. Knepley 342565d0bSMatthew G. Knepley #include <petscdmplex.h> 442565d0bSMatthew G. Knepley 5d71ae5a4SJacob Faibussowitsch static PetscErrorCode EstimateMemory(DM dm, PetscLogDouble *est) 6d71ae5a4SJacob Faibussowitsch { 742565d0bSMatthew G. Knepley DMLabel marker; 842565d0bSMatthew G. Knepley PetscInt cdim, depth, d, pStart, pEnd, p, Nd[4] = {0, 0, 0, 0}, lsize = 0, rmem = 0, imem = 0; 942565d0bSMatthew G. Knepley PetscInt coneSecMem = 0, coneMem = 0, supportSecMem = 0, supportMem = 0, labelMem = 0; 1042565d0bSMatthew G. Knepley 1142565d0bSMatthew G. Knepley PetscFunctionBeginUser; 129566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, "Memory Estimates\n")); 139566063dSJacob Faibussowitsch PetscCall(DMGetCoordinateDim(dm, &cdim)); 149566063dSJacob Faibussowitsch PetscCall(DMPlexGetDepth(dm, &depth)); 159566063dSJacob Faibussowitsch PetscCall(DMPlexGetChart(dm, &pStart, &pEnd)); 1642565d0bSMatthew G. Knepley for (d = 0; d <= depth; ++d) { 1742565d0bSMatthew G. Knepley PetscInt start, end; 1842565d0bSMatthew G. Knepley 199566063dSJacob Faibussowitsch PetscCall(DMPlexGetDepthStratum(dm, d, &start, &end)); 2042565d0bSMatthew G. Knepley Nd[d] = end - start; 2142565d0bSMatthew G. Knepley } 2242565d0bSMatthew G. Knepley /* Coordinates: 3 Nv reals + 2*Nv + 2*Nv ints */ 2342565d0bSMatthew G. Knepley rmem += cdim * Nd[0]; 2442565d0bSMatthew G. Knepley imem += 2 * Nd[0] + 2 * Nd[0]; 2563a3b9bcSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, " Coordinate mem: %" PetscInt_FMT " %" PetscInt_FMT "\n", (PetscInt)(cdim * Nd[0] * sizeof(PetscReal)), (PetscInt)(4 * Nd[0] * sizeof(PetscInt)))); 2642565d0bSMatthew G. Knepley /* Depth: Nc+Nf+Ne+Nv ints */ 2742565d0bSMatthew G. Knepley for (d = 0; d <= depth; ++d) labelMem += Nd[d]; 2842565d0bSMatthew G. Knepley /* Cell Type: Nc+Nf+Ne+Nv ints */ 2942565d0bSMatthew G. Knepley for (d = 0; d <= depth; ++d) labelMem += Nd[d]; 3042565d0bSMatthew G. Knepley /* Marker */ 319566063dSJacob Faibussowitsch PetscCall(DMGetLabel(dm, "marker", &marker)); 329566063dSJacob Faibussowitsch if (marker) PetscCall(DMLabelGetStratumSize(marker, 1, &lsize)); 3342565d0bSMatthew G. Knepley labelMem += lsize; 3463a3b9bcSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, " Label mem: %" PetscInt_FMT "\n", (PetscInt)(labelMem * sizeof(PetscInt)))); 3542565d0bSMatthew G. Knepley //imem += labelMem; 3642565d0bSMatthew G. Knepley /* Cones and Orientations: 4 Nc + 3 Nf + 2 Ne ints + (Nc+Nf+Ne) ints no separate orientation section */ 3742565d0bSMatthew G. Knepley for (d = 0; d <= depth; ++d) coneSecMem += 2 * Nd[d]; 3842565d0bSMatthew G. Knepley for (p = pStart; p < pEnd; ++p) { 3942565d0bSMatthew G. Knepley PetscInt csize; 4042565d0bSMatthew G. Knepley 419566063dSJacob Faibussowitsch PetscCall(DMPlexGetConeSize(dm, p, &csize)); 4242565d0bSMatthew G. Knepley coneMem += csize; 4342565d0bSMatthew G. Knepley } 4463a3b9bcSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, " Cone mem: %" PetscInt_FMT " %" PetscInt_FMT " (%" PetscInt_FMT ")\n", (PetscInt)(coneMem * sizeof(PetscInt)), (PetscInt)(coneSecMem * sizeof(PetscInt)), (PetscInt)(coneMem * sizeof(PetscInt)))); 4542565d0bSMatthew G. Knepley imem += 2 * coneMem + coneSecMem; 4642565d0bSMatthew G. Knepley /* Supports: 4 Nc + 3 Nf + 2 Ne ints + Nc+Nf+Ne ints */ 4742565d0bSMatthew G. Knepley for (d = 0; d <= depth; ++d) supportSecMem += 2 * Nd[d]; 4842565d0bSMatthew G. Knepley for (p = pStart; p < pEnd; ++p) { 4942565d0bSMatthew G. Knepley PetscInt ssize; 5042565d0bSMatthew G. Knepley 519566063dSJacob Faibussowitsch PetscCall(DMPlexGetSupportSize(dm, p, &ssize)); 5242565d0bSMatthew G. Knepley supportMem += ssize; 5342565d0bSMatthew G. Knepley } 5463a3b9bcSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_SELF, " Support mem: %" PetscInt_FMT " %" PetscInt_FMT "\n", (PetscInt)(supportMem * sizeof(PetscInt)), (PetscInt)(supportSecMem * sizeof(PetscInt)))); 5542565d0bSMatthew G. Knepley imem += supportMem + supportSecMem; 5642565d0bSMatthew G. Knepley *est = ((PetscLogDouble)imem) * sizeof(PetscInt) + ((PetscLogDouble)rmem) * sizeof(PetscReal); 5763a3b9bcSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD, " Estimated memory %" PetscInt_FMT "\n", (PetscInt)*est)); 5842565d0bSMatthew G. Knepley PetscFunctionReturn(0); 5942565d0bSMatthew G. Knepley } 6042565d0bSMatthew G. Knepley 61d71ae5a4SJacob Faibussowitsch int main(int argc, char **argv) 62d71ae5a4SJacob Faibussowitsch { 6342565d0bSMatthew G. Knepley DM dm; 6442565d0bSMatthew G. Knepley PetscBool trace = PETSC_FALSE, checkMemory = PETSC_TRUE, auxMemory = PETSC_FALSE; 6542565d0bSMatthew G. Knepley PetscLogDouble before, after, est = 0, clean, max; 6642565d0bSMatthew G. Knepley 67327415f7SBarry Smith PetscFunctionBeginUser; 689566063dSJacob Faibussowitsch PetscCall(PetscInitialize(&argc, &argv, NULL, help)); 699566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(NULL, NULL, "-trace", &trace, NULL)); 709566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(NULL, NULL, "-check_memory", &checkMemory, NULL)); 719566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(NULL, NULL, "-aux_memory", &auxMemory, NULL)); 729566063dSJacob Faibussowitsch PetscCall(PetscMemorySetGetMaximumUsage()); 739566063dSJacob Faibussowitsch PetscCall(PetscMallocGetCurrentUsage(&before)); 749566063dSJacob Faibussowitsch if (trace) PetscCall(PetscMallocTraceSet(NULL, PETSC_TRUE, 5000.)); 759566063dSJacob Faibussowitsch PetscCall(DMCreate(PETSC_COMM_WORLD, &dm)); 769566063dSJacob Faibussowitsch PetscCall(DMSetType(dm, DMPLEX)); 779566063dSJacob Faibussowitsch PetscCall(DMSetFromOptions(dm)); 789566063dSJacob Faibussowitsch if (trace) PetscCall(PetscMallocTraceSet(NULL, PETSC_FALSE, 5000)); 799566063dSJacob Faibussowitsch PetscCall(DMViewFromOptions(dm, NULL, "-dm_view")); 809566063dSJacob Faibussowitsch PetscCall(PetscMallocGetCurrentUsage(&after)); 819566063dSJacob Faibussowitsch PetscCall(PetscMemoryGetMaximumUsage(&max)); 829566063dSJacob Faibussowitsch PetscCall(EstimateMemory(dm, &est)); 839566063dSJacob Faibussowitsch PetscCall(DMDestroy(&dm)); 849566063dSJacob Faibussowitsch PetscCall(PetscMallocGetCurrentUsage(&clean)); 859566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD, "Measured Memory\n")); 8642565d0bSMatthew G. Knepley if (auxMemory) { 879371c9d4SSatish Balay PetscCall(PetscPrintf(PETSC_COMM_WORLD, " Initial memory %" PetscInt_FMT "\n Extra memory for build %" PetscInt_FMT "\n Memory after destroy %" PetscInt_FMT "\n", (PetscInt)before, (PetscInt)(max - after), (PetscInt)clean)); 8842565d0bSMatthew G. Knepley } 8942565d0bSMatthew G. Knepley if (checkMemory) { 9063a3b9bcSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD, " Memory for mesh %" PetscInt_FMT "\n", (PetscInt)(after - before))); 9163a3b9bcSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD, "Discrepancy %" PetscInt_FMT "\n", (PetscInt)PetscAbsReal(after - before - est))); 9242565d0bSMatthew G. Knepley } 939566063dSJacob Faibussowitsch PetscCall(PetscFinalize()); 94b122ec5aSJacob Faibussowitsch return 0; 9542565d0bSMatthew G. Knepley } 9642565d0bSMatthew G. Knepley 9742565d0bSMatthew G. Knepley /*TEST 9842565d0bSMatthew G. Knepley build: 99dfd57a17SPierre Jolivet requires: !defined(PETSC_USE_64BIT_INDICES) double !complex !defined(PETSCTEST_VALGRIND) 10042565d0bSMatthew G. Knepley 101a5b23f4aSJose E. Roman # Memory checks cannot be included in tests because the allocated memory differs among environments 10242565d0bSMatthew G. Knepley testset: 103*6c2b77d5SStefano Zampini requires: !defined(PETSC_HAVE_THREADSAFETY) 10442565d0bSMatthew G. Knepley args: -malloc_requested_size -dm_plex_box_faces 5,5 -check_memory 0 10542565d0bSMatthew G. Knepley test: 10642565d0bSMatthew G. Knepley suffix: tri 10742565d0bSMatthew G. Knepley requires: triangle 10830602db0SMatthew G. Knepley args: -dm_plex_simplex 1 -dm_plex_interpolate 0 10942565d0bSMatthew G. Knepley 11042565d0bSMatthew G. Knepley test: 11142565d0bSMatthew G. Knepley suffix: tri_interp 11242565d0bSMatthew G. Knepley requires: triangle 11330602db0SMatthew G. Knepley args: -dm_plex_simplex 1 -dm_plex_interpolate 1 11442565d0bSMatthew G. Knepley 11542565d0bSMatthew G. Knepley test: 11642565d0bSMatthew G. Knepley suffix: quad 11730602db0SMatthew G. Knepley args: -dm_plex_simplex 0 -dm_plex_interpolate 0 11842565d0bSMatthew G. Knepley 11942565d0bSMatthew G. Knepley test: 12042565d0bSMatthew G. Knepley suffix: quad_interp 12130602db0SMatthew G. Knepley args: -dm_plex_simplex 0 -dm_plex_interpolate 1 12242565d0bSMatthew G. Knepley 12330602db0SMatthew G. Knepley # Memory checks cannot be included in tests because the allocated memory differs among environments 12442565d0bSMatthew G. Knepley testset: 125*6c2b77d5SStefano Zampini requires: !defined(PETSC_HAVE_THREADSAFETY) 12630602db0SMatthew G. Knepley args: -malloc_requested_size -dm_plex_dim 3 -dm_plex_box_faces 5,5,5 -check_memory 0 127da87d8e5SMatthew G. Knepley 128da87d8e5SMatthew G. Knepley # Filter out label memory because tet mesher produce different surface meshes for different compilers 12942565d0bSMatthew G. Knepley test: 13042565d0bSMatthew G. Knepley suffix: tet 13142565d0bSMatthew G. Knepley requires: ctetgen 132da87d8e5SMatthew G. Knepley filter: grep -v "Label mem:" 13330602db0SMatthew G. Knepley args: -dm_plex_simplex 1 -dm_plex_interpolate 0 13442565d0bSMatthew G. Knepley 135da87d8e5SMatthew G. Knepley # Filter out label memory because tet mesher produce different surface meshes for different compilers 13642565d0bSMatthew G. Knepley test: 13742565d0bSMatthew G. Knepley suffix: tet_interp 13842565d0bSMatthew G. Knepley requires: ctetgen 139da87d8e5SMatthew G. Knepley filter: grep -v "Label mem:" 14030602db0SMatthew G. Knepley args: -dm_plex_simplex 1 -dm_plex_interpolate 1 14142565d0bSMatthew G. Knepley 14242565d0bSMatthew G. Knepley test: 14342565d0bSMatthew G. Knepley suffix: hex 14430602db0SMatthew G. Knepley args: -dm_plex_simplex 0 -dm_plex_interpolate 0 14542565d0bSMatthew G. Knepley 14642565d0bSMatthew G. Knepley test: 14742565d0bSMatthew G. Knepley suffix: hex_interp 14830602db0SMatthew G. Knepley args: -dm_plex_simplex 0 -dm_plex_interpolate 1 14942565d0bSMatthew G. Knepley TEST*/ 150