/* Code that allows a user to dictate what malloc() PETSc uses. */ #include /*I "petscsys.h" I*/ #include #if defined(PETSC_HAVE_MALLOC_H) #include #endif #if defined(PETSC_HAVE_MEMKIND) #include typedef enum {PETSC_MK_DEFAULT=0,PETSC_MK_HBW=1} PetscMemkindType; PetscMemkindType currentmktype = PETSC_MK_HBW; PetscMemkindType previousmktype = PETSC_MK_HBW; #endif /* We want to make sure that all mallocs of double or complex numbers are complex aligned. 1) on systems with memalign() we call that routine to get an aligned memory location 2) on systems without memalign() we - allocate one sizeof(PetscScalar) extra space - we shift the pointer up slightly if needed to get PetscScalar aligned - if shifted we store at ptr[-1] the amount of shift (plus a classid) */ #define SHIFT_CLASSID 456123 PetscErrorCode PetscMallocAlign(size_t mem,int line,const char func[],const char file[],void **result) { if (!mem) { *result = NULL; return 0; } #if defined(PETSC_HAVE_MEMKIND) { int ierr; if (!currentmktype) ierr = memkind_posix_memalign(MEMKIND_DEFAULT,result,PETSC_MEMALIGN,mem); else ierr = memkind_posix_memalign(MEMKIND_HBW,result,PETSC_MEMALIGN,mem); if (ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MEM,"Memory requested with memkind %.0f",(PetscLogDouble)mem); } #else # if defined(PETSC_HAVE_DOUBLE_ALIGN_MALLOC) && (PETSC_MEMALIGN == 8) *result = malloc(mem); # elif defined(PETSC_HAVE_MEMALIGN) *result = memalign(PETSC_MEMALIGN,mem); # else { /* malloc space for two extra chunks and shift ptr 1 + enough to get it PetscScalar aligned */ int *ptr = (int*)malloc(mem + 2*PETSC_MEMALIGN); if (ptr) { int shift = (int)(((PETSC_UINTPTR_T) ptr) % PETSC_MEMALIGN); shift = (2*PETSC_MEMALIGN - shift)/sizeof(int); ptr[shift-1] = shift + SHIFT_CLASSID; ptr += shift; *result = (void*)ptr; } else { *result = NULL; } } # endif #endif if (!*result) return PetscError(PETSC_COMM_SELF,line,func,file,PETSC_ERR_MEM,PETSC_ERROR_INITIAL,"Memory requested %.0f",(PetscLogDouble)mem); return 0; } PetscErrorCode PetscFreeAlign(void *ptr,int line,const char func[],const char file[]) { if (!ptr) return 0; #if defined(PETSC_HAVE_MEMKIND) memkind_free(0,ptr); /* specify the kind to 0 so that memkind will look up for the right type */ #else # if (!(defined(PETSC_HAVE_DOUBLE_ALIGN_MALLOC) && (PETSC_MEMALIGN == 8)) && !defined(PETSC_HAVE_MEMALIGN)) { /* Previous int tells us how many ints the pointer has been shifted from the original address provided by the system malloc(). */ int shift = *(((int*)ptr)-1) - SHIFT_CLASSID; if (shift > PETSC_MEMALIGN-1) return PetscError(PETSC_COMM_SELF,line,func,file,PETSC_ERR_PLIB,PETSC_ERROR_INITIAL,"Likely memory corruption in heap"); if (shift < 0) return PetscError(PETSC_COMM_SELF,line,func,file,PETSC_ERR_PLIB,PETSC_ERROR_INITIAL,"Likely memory corruption in heap"); ptr = (void*)(((int*)ptr) - shift); } # endif # if defined(PETSC_HAVE_FREE_RETURN_INT) int err = free(ptr); if (err) return PetscError(PETSC_COMM_SELF,line,func,file,PETSC_ERR_PLIB,PETSC_ERROR_INITIAL,"System free returned error %d\n",err); # else free(ptr); # endif #endif return 0; } PetscErrorCode PetscReallocAlign(size_t mem, int line, const char func[], const char file[], void **result) { PetscErrorCode ierr; if (!mem) { ierr = PetscFreeAlign(*result, line, func, file); if (ierr) return ierr; *result = NULL; return 0; } #if defined(PETSC_HAVE_MEMKIND) if (!currentmktype) *result = memkind_realloc(MEMKIND_DEFAULT,*result,mem); else *result = memkind_realloc(MEMKIND_HBW,*result,mem); #else # if (!(defined(PETSC_HAVE_DOUBLE_ALIGN_MALLOC) && (PETSC_MEMALIGN == 8)) && !defined(PETSC_HAVE_MEMALIGN)) { /* Previous int tells us how many ints the pointer has been shifted from the original address provided by the system malloc(). */ int shift = *(((int*)*result)-1) - SHIFT_CLASSID; if (shift > PETSC_MEMALIGN-1) return PetscError(PETSC_COMM_SELF,line,func,file,PETSC_ERR_PLIB,PETSC_ERROR_INITIAL,"Likely memory corruption in heap"); if (shift < 0) return PetscError(PETSC_COMM_SELF,line,func,file,PETSC_ERR_PLIB,PETSC_ERROR_INITIAL,"Likely memory corruption in heap"); *result = (void*)(((int*)*result) - shift); } # endif # if (defined(PETSC_HAVE_DOUBLE_ALIGN_MALLOC) && (PETSC_MEMALIGN == 8)) || defined(PETSC_HAVE_MEMALIGN) *result = realloc(*result, mem); # else { /* malloc space for two extra chunks and shift ptr 1 + enough to get it PetscScalar aligned */ int *ptr = (int *) realloc(*result, mem + 2*PETSC_MEMALIGN); if (ptr) { int shift = (int)(((PETSC_UINTPTR_T) ptr) % PETSC_MEMALIGN); shift = (2*PETSC_MEMALIGN - shift)/sizeof(int); ptr[shift-1] = shift + SHIFT_CLASSID; ptr += shift; *result = (void*)ptr; } else { *result = NULL; } } # endif #endif if (!*result) return PetscError(PETSC_COMM_SELF,line,func,file,PETSC_ERR_MEM,PETSC_ERROR_INITIAL,"Memory requested %.0f",(PetscLogDouble)mem); #if defined(PETSC_HAVE_MEMALIGN) /* There are no standard guarantees that realloc() maintains the alignment of memalign(), so I think we have to * realloc and, if the alignment is wrong, malloc/copy/free. */ if (((size_t) (*result)) % PETSC_MEMALIGN) { void *newResult; # if defined(PETSC_HAVE_MEMKIND) { int ierr; if (!currentmktype) ierr = memkind_posix_memalign(MEMKIND_DEFAULT,&newResult,PETSC_MEMALIGN,mem); else ierr = memkind_posix_memalign(MEMKIND_HBW,&newResult,PETSC_MEMALIGN,mem); if (ierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_MEM,"Memory requested with memkind %.0f",(PetscLogDouble)mem); } # else newResult = memalign(PETSC_MEMALIGN,mem); # endif if (!newResult) return PetscError(PETSC_COMM_SELF,line,func,file,PETSC_ERR_MEM,PETSC_ERROR_INITIAL,"Memory requested %.0f",(PetscLogDouble)mem); ierr = PetscMemcpy(newResult,*result,mem); if (ierr) return ierr; # if defined(PETSC_HAVE_FREE_RETURN_INT) { int err = free(*result); if (err) return PetscError(PETSC_COMM_SELF,line,func,file,PETSC_ERR_PLIB,PETSC_ERROR_INITIAL,"System free returned error %d\n",err); } # else # if defined(PETSC_HAVE_MEMKIND) memkind_free(0,*result); # else free(*result); # endif # endif *result = newResult; } #endif return 0; } PetscErrorCode (*PetscTrMalloc)(size_t,int,const char[],const char[],void**) = PetscMallocAlign; PetscErrorCode (*PetscTrFree)(void*,int,const char[],const char[]) = PetscFreeAlign; PetscErrorCode (*PetscTrRealloc)(size_t,int,const char[],const char[],void**) = PetscReallocAlign; PetscBool petscsetmallocvisited = PETSC_FALSE; /*@C PetscMallocSet - Sets the routines used to do mallocs and frees. This routine MUST be called before PetscInitialize() and may be called only once. Not Collective Input Parameters: + malloc - the malloc routine - free - the free routine Level: developer Concepts: malloc Concepts: memory^allocation @*/ PetscErrorCode PetscMallocSet(PetscErrorCode (*imalloc)(size_t,int,const char[],const char[],void**), PetscErrorCode (*ifree)(void*,int,const char[],const char[])) { PetscFunctionBegin; if (petscsetmallocvisited && (imalloc != PetscTrMalloc || ifree != PetscTrFree)) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"cannot call multiple times"); PetscTrMalloc = imalloc; PetscTrFree = ifree; petscsetmallocvisited = PETSC_TRUE; PetscFunctionReturn(0); } /*@C PetscMallocClear - Resets the routines used to do mallocs and frees to the defaults. Not Collective Level: developer Notes: In general one should never run a PETSc program with different malloc() and free() settings for different parts; this is because one NEVER wants to free() an address that was malloced by a different memory management system @*/ PetscErrorCode PetscMallocClear(void) { PetscFunctionBegin; PetscTrMalloc = PetscMallocAlign; PetscTrFree = PetscFreeAlign; petscsetmallocvisited = PETSC_FALSE; PetscFunctionReturn(0); } PetscErrorCode PetscMemoryTrace(const char label[]) { PetscErrorCode ierr; PetscLogDouble mem,mal; static PetscLogDouble oldmem = 0,oldmal = 0; PetscFunctionBegin; ierr = PetscMemoryGetCurrentUsage(&mem);CHKERRQ(ierr); ierr = PetscMallocGetCurrentUsage(&mal);CHKERRQ(ierr); ierr = PetscPrintf(PETSC_COMM_WORLD,"%s High water %8.3f MB increase %8.3f MB Current %8.3f MB increase %8.3f MB\n",label,mem*1e-6,(mem - oldmem)*1e-6,mal*1e-6,(mal - oldmal)*1e-6);CHKERRQ(ierr); oldmem = mem; oldmal = mal; PetscFunctionReturn(0); } static PetscErrorCode (*PetscTrMallocOld)(size_t,int,const char[],const char[],void**) = PetscMallocAlign; static PetscErrorCode (*PetscTrFreeOld)(void*,int,const char[],const char[]) = PetscFreeAlign; /*@C PetscMallocSetDRAM - Set PetscMalloc to use DRAM. If memkind is available, change the memkind type. Otherwise, switch the current malloc and free routines to the PetscMallocAlign and PetscFreeAlign (PETSc default). Not Collective Level: developer Notes: This provides a way to do the allocation on DRAM temporarily. One can switch back to the previous choice by calling PetscMallocReset(). .seealso: PetscMallocReset() @*/ PetscErrorCode PetscMallocSetDRAM(void) { PetscFunctionBegin; if (PetscTrMalloc == PetscMallocAlign) { #if defined(PETSC_HAVE_MEMKIND) previousmktype = currentmktype; currentmktype = PETSC_MK_DEFAULT; #endif } else { /* Save the previous choice */ PetscTrMallocOld = PetscTrMalloc; PetscTrFreeOld = PetscTrFree; PetscTrMalloc = PetscMallocAlign; PetscTrFree = PetscFreeAlign; } PetscFunctionReturn(0); } /*@C PetscMallocResetDRAM - Reset the changes made by PetscMallocSetDRAM Not Collective Level: developer .seealso: PetscMallocSetDRAM() @*/ PetscErrorCode PetscMallocResetDRAM(void) { PetscFunctionBegin; if (PetscTrMalloc == PetscMallocAlign) { #if defined(PETSC_HAVE_MEMKIND) currentmktype = previousmktype; #endif } else { /* Reset to the previous choice */ PetscTrMalloc = PetscTrMallocOld; PetscTrFree = PetscTrFreeOld; } PetscFunctionReturn(0); } static PetscBool petscmalloccoalesce = #if defined(PETSC_USE_MALLOC_COALESCED) PETSC_TRUE; #else PETSC_FALSE; #endif /*@C PetscMallocSetCoalesce - Use coalesced malloc when allocating groups of objects Not Collective Input Parameters: . coalesce - PETSC_TRUE to use coalesced malloc for multi-object allocation. Options Database Keys: . -malloc_coalesce - turn coalesced malloc on or off Note: PETSc uses coalesced malloc by default for optimized builds and not for debugging builds. This default can be changed via the command-line option -malloc_coalesce or by calling this function. Level: developer .seealso: PetscMallocA() @*/ PetscErrorCode PetscMallocSetCoalesce(PetscBool coalesce) { PetscFunctionBegin; petscmalloccoalesce = coalesce; PetscFunctionReturn(0); } /*@C PetscMallocA - Allocate and optionally clear one or more objects, possibly using coalesced malloc Not Collective Input Parameters: + n - number of objects to allocate (at least 1) . lineno - line number to attribute allocation (typically __LINE__) . function - function to attribute allocation (typically PETSC_FUNCTION_NAME) . filename - file name to attribute allocation (typically __FILE__) - bytes0 - first of n object sizes Output Parameters: . ptr0 - first of n pointers to allocate Notes: This function is not normally called directly by users, but rather via the macros PetscMalloc1(), PetscMalloc2(), or PetscCalloc1(), etc. Level: developer .seealso: PetscMallocAlign(), PetscMallocSet(), PetscMalloc1(), PetscMalloc2(), PetscMalloc3(), PetscMalloc4(), PetscMalloc5(), PetscMalloc6(), PetscMalloc7(), PetscCalloc1(), PetscCalloc2(), PetscCalloc3(), PetscCalloc4(), PetscCalloc5(), PetscCalloc6(), PetscCalloc7(), PetscFreeA() @*/ PetscErrorCode PetscMallocA(int n,PetscBool clear,int lineno,const char *function,const char *filename,size_t bytes0,void *ptr0,...) { PetscErrorCode ierr; va_list Argp; size_t bytes[8],sumbytes; void **ptr[8]; int i; PetscFunctionBegin; if (n > 8) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Attempt to allocate %d objects but only 8 supported",n); bytes[0] = bytes0; ptr[0] = (void**)ptr0; sumbytes = (bytes0 + PETSC_MEMALIGN-1) & ~(PETSC_MEMALIGN-1); va_start(Argp,ptr0); for (i=1; i 8) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Attempt to allocate %d objects but only 8 supported",n); ptr[0] = (void**)ptr0; va_start(Argp,ptr0); for (i=1; i i) { *ptr[n] = NULL; } ierr = (*PetscTrFree)(*ptr[n],lineno,function,filename);CHKERRQ(ierr); *ptr[n] = NULL; } else { while (--n >= 0) { ierr = (*PetscTrFree)(*ptr[n],lineno,function,filename);CHKERRQ(ierr); *ptr[n] = NULL; } } PetscFunctionReturn(0); }