1e5c89e4eSSatish Balay #define PETSC_DLL 2e5c89e4eSSatish Balay 3e5c89e4eSSatish Balay /* 4e5c89e4eSSatish Balay We define the memory operations here. The reason we just do not use 5e5c89e4eSSatish Balay the standard memory routines in the PETSc code is that on some machines 6e5c89e4eSSatish Balay they are broken. 7e5c89e4eSSatish Balay 8e5c89e4eSSatish Balay */ 9e5c89e4eSSatish Balay #include "petsc.h" /*I "petsc.h" I*/ 10e5c89e4eSSatish Balay #include "src/inline/axpy.h" 11e5c89e4eSSatish Balay 12e5c89e4eSSatish Balay /* 13e5c89e4eSSatish Balay On the IBM Rs6000 using the Gnu G++ compiler you may have to include 14e5c89e4eSSatish Balay <string.h> instead of <memory.h> 15e5c89e4eSSatish Balay */ 16e5c89e4eSSatish Balay #include <memory.h> 17e5c89e4eSSatish Balay #if defined(PETSC_HAVE_STRINGS_H) 18e5c89e4eSSatish Balay #include <strings.h> 19e5c89e4eSSatish Balay #endif 20e5c89e4eSSatish Balay #if defined(PETSC_HAVE_STRING_H) 21e5c89e4eSSatish Balay #include <string.h> 22e5c89e4eSSatish Balay #endif 23e5c89e4eSSatish Balay #if defined(PETSC_HAVE_STDLIB_H) 24e5c89e4eSSatish Balay #include <stdlib.h> 25e5c89e4eSSatish Balay #endif 26e5c89e4eSSatish Balay #include "petscfix.h" 27e5c89e4eSSatish Balay #include "petscbt.h" 28e5c89e4eSSatish Balay #if defined(PETSC_PREFER_DCOPY_FOR_MEMCPY) 29e5c89e4eSSatish Balay #include "petscblaslapack.h" 30e5c89e4eSSatish Balay #endif 31e5c89e4eSSatish Balay 32e5c89e4eSSatish Balay #undef __FUNCT__ 33e5c89e4eSSatish Balay #define __FUNCT__ "PetscMemcpy" 34e30d2299SSatish Balay /*@ 35e5c89e4eSSatish Balay PetscMemcpy - Copies n bytes, beginning at location b, to the space 36e5c89e4eSSatish Balay beginning at location a. The two memory regions CANNOT overlap, use 37e5c89e4eSSatish Balay PetscMemmove() in that case. 38e5c89e4eSSatish Balay 39e5c89e4eSSatish Balay Not Collective 40e5c89e4eSSatish Balay 41e5c89e4eSSatish Balay Input Parameters: 42e5c89e4eSSatish Balay + b - pointer to initial memory space 43e5c89e4eSSatish Balay - n - length (in bytes) of space to copy 44e5c89e4eSSatish Balay 45e5c89e4eSSatish Balay Output Parameter: 46e5c89e4eSSatish Balay . a - pointer to copy space 47e5c89e4eSSatish Balay 48e5c89e4eSSatish Balay Level: intermediate 49e5c89e4eSSatish Balay 50e5c89e4eSSatish Balay Compile Option: 51e5c89e4eSSatish Balay PETSC_PREFER_DCOPY_FOR_MEMCPY will cause the BLAS dcopy() routine to be used 52e5c89e4eSSatish Balay for memory copies on double precision values. 53e5c89e4eSSatish Balay PETSC_PREFER_COPY_FOR_MEMCPY will cause C code to be used 54e5c89e4eSSatish Balay for memory copies on double precision values. 55e5c89e4eSSatish Balay PETSC_PREFER_FORTRAN_FORMEMCPY will cause Fortran code to be used 56e5c89e4eSSatish Balay for memory copies on double precision values. 57e5c89e4eSSatish Balay 58e5c89e4eSSatish Balay Note: 59e5c89e4eSSatish Balay This routine is analogous to memcpy(). 60e5c89e4eSSatish Balay 61e5c89e4eSSatish Balay Concepts: memory^copying 62e5c89e4eSSatish Balay Concepts: copying^memory 63e5c89e4eSSatish Balay 64e5c89e4eSSatish Balay .seealso: PetscMemmove() 65e5c89e4eSSatish Balay 66e5c89e4eSSatish Balay @*/ 67e5c89e4eSSatish Balay PetscErrorCode PETSC_DLLEXPORT PetscMemcpy(void *a,const void *b,size_t n) 68e5c89e4eSSatish Balay { 69e5c89e4eSSatish Balay unsigned long al = (unsigned long) a,bl = (unsigned long) b; 70e5c89e4eSSatish Balay unsigned long nl = (unsigned long) n; 71e5c89e4eSSatish Balay 72e5c89e4eSSatish Balay PetscFunctionBegin; 73e5c89e4eSSatish Balay if (n > 0 && !b) SETERRQ(PETSC_ERR_ARG_NULL,"Trying to copy from a null pointer"); 74e5c89e4eSSatish Balay if (n > 0 && !a) SETERRQ(PETSC_ERR_ARG_NULL,"Trying to copy to a null pointer"); 75e5c89e4eSSatish Balay if (a != b) { 76e5c89e4eSSatish Balay #if !defined(PETSC_HAVE_CRAY90_POINTER) 77e5c89e4eSSatish Balay if ((al > bl && (al - bl) < nl) || (bl - al) < nl) { 78e5c89e4eSSatish Balay SETERRQ3(PETSC_ERR_ARG_INCOMP,"Memory regions overlap: either use PetscMemmov()\n\ 79e5c89e4eSSatish Balay or make sure your copy regions and lengths are correct. \n\ 80e5c89e4eSSatish Balay Length (bytes) %ld first address %ld second address %ld",nl,al,bl); 81e5c89e4eSSatish Balay } 82e5c89e4eSSatish Balay #endif 83e5c89e4eSSatish Balay #if (defined(PETSC_PREFER_DCOPY_FOR_MEMCPY) || defined(PETSC_PREFER_COPY_FOR_MEMCPY) || defined(PETSC_PREFER_FORTRAN_FORMEMCPY)) 84e5c89e4eSSatish Balay if (!(((long) a) % sizeof(PetscScalar)) && !(n % sizeof(PetscScalar))) { 85e5c89e4eSSatish Balay size_t len = n/sizeof(PetscScalar); 86e5c89e4eSSatish Balay #if defined(PETSC_PREFER_DCOPY_FOR_MEMCPY) 87e5c89e4eSSatish Balay PetscBLASInt blen = (PetscBLASInt) len,one = 1; 88e5c89e4eSSatish Balay BLAScopy_(&blen,(PetscScalar *)b,&one,(PetscScalar *)a,&one); 89e5c89e4eSSatish Balay #elif defined(PETSC_PREFER_FORTRAN_FORMEMCPY) 90e5c89e4eSSatish Balay fortrancopy_(&len,(PetscScalar*)b,(PetscScalar*)a); 91e5c89e4eSSatish Balay #else 92e5c89e4eSSatish Balay size_t i; 93e5c89e4eSSatish Balay PetscScalar *x = (PetscScalar*)b, *y = (PetscScalar*)a; 94e5c89e4eSSatish Balay for (i=0; i<len; i++) y[i] = x[i]; 95e5c89e4eSSatish Balay #endif 96e5c89e4eSSatish Balay } else { 97e5c89e4eSSatish Balay memcpy((char*)(a),(char*)(b),n); 98e5c89e4eSSatish Balay } 991b54b3b6SSatish Balay #elif defined(PETSC_HAVE__INTEL_FAST_MEMCPY) 1001b54b3b6SSatish Balay _intel_fast_memcpy((char*)(a),(char*)(b),n); 101e5c89e4eSSatish Balay #else 102e5c89e4eSSatish Balay memcpy((char*)(a),(char*)(b),n); 103e5c89e4eSSatish Balay #endif 104e5c89e4eSSatish Balay } 105e5c89e4eSSatish Balay PetscFunctionReturn(0); 106e5c89e4eSSatish Balay } 107e5c89e4eSSatish Balay 108e5c89e4eSSatish Balay #undef __FUNCT__ 109e5c89e4eSSatish Balay #define __FUNCT__ "PetscBitMemcpy" 110e5c89e4eSSatish Balay /*@C 111e5c89e4eSSatish Balay PetscBitMemcpy - Copies an amount of data. This can include bit data. 112e5c89e4eSSatish Balay 113e5c89e4eSSatish Balay Not Collective 114e5c89e4eSSatish Balay 115e5c89e4eSSatish Balay Input Parameters: 116e5c89e4eSSatish Balay + b - pointer to initial memory space 117e5c89e4eSSatish Balay . bi - offset of initial memory space (in elementary chunk sizes) 118e5c89e4eSSatish Balay . bs - length (in elementary chunk sizes) of space to copy 119e5c89e4eSSatish Balay - dtype - datatype, for example, PETSC_INT, PETSC_DOUBLE, PETSC_LOGICAL 120e5c89e4eSSatish Balay 121e5c89e4eSSatish Balay Output Parameters: 122e5c89e4eSSatish Balay + a - pointer to result memory space 123e5c89e4eSSatish Balay - ai - offset of result memory space (in elementary chunk sizes) 124e5c89e4eSSatish Balay 125e5c89e4eSSatish Balay Level: intermediate 126e5c89e4eSSatish Balay 127e5c89e4eSSatish Balay Note: 128e5c89e4eSSatish Balay This routine is analogous to PetscMemcpy(), except when the data type is 129e5c89e4eSSatish Balay PETSC_LOGICAL. 130e5c89e4eSSatish Balay 131e5c89e4eSSatish Balay Concepts: memory^comparing 132e5c89e4eSSatish Balay Concepts: comparing^memory 133e5c89e4eSSatish Balay 134e5c89e4eSSatish Balay .seealso: PetscMemmove(), PetscMemcpy() 135e5c89e4eSSatish Balay 136e5c89e4eSSatish Balay @*/ 137e5c89e4eSSatish Balay PetscErrorCode PETSC_DLLEXPORT PetscBitMemcpy(void *a,PetscInt ai,const void *b,PetscInt bi,PetscInt bs,PetscDataType dtype) 138e5c89e4eSSatish Balay { 139e5c89e4eSSatish Balay char *aa = (char *)a,*bb = (char *)b; 140*2ad021e3SSatish Balay size_t dsize; 141e5c89e4eSSatish Balay PetscErrorCode ierr; 142e5c89e4eSSatish Balay 143e5c89e4eSSatish Balay PetscFunctionBegin; 144e5c89e4eSSatish Balay if (bs > 0 && !b) SETERRQ(PETSC_ERR_ARG_NULL,"Trying to copy from a null pointer"); 145e5c89e4eSSatish Balay if (bs > 0 && !a) SETERRQ(PETSC_ERR_ARG_NULL,"Trying to copy to a null pointer"); 146e5c89e4eSSatish Balay if (dtype != PETSC_LOGICAL) { 147e5c89e4eSSatish Balay ierr = PetscDataTypeGetSize(dtype,&dsize);CHKERRQ(ierr); 148e5c89e4eSSatish Balay ierr = PetscMemcpy(aa+ai*dsize,bb+bi*dsize,bs*dsize);CHKERRQ(ierr); 149e5c89e4eSSatish Balay } else { 150e5c89e4eSSatish Balay PetscBT at = (PetscBT) a; 151e5c89e4eSSatish Balay PetscBT bt = (PetscBT) b; 152e5c89e4eSSatish Balay PetscInt i; 153e5c89e4eSSatish Balay for (i=0; i<bs; i++) { 154e5c89e4eSSatish Balay if (PetscBTLookup(bt,bi+i)) {ierr = PetscBTSet(at,ai+i);CHKERRQ(ierr);} 155e5c89e4eSSatish Balay else {ierr = PetscBTClear(at,ai+i);CHKERRQ(ierr);} 156e5c89e4eSSatish Balay } 157e5c89e4eSSatish Balay } 158e5c89e4eSSatish Balay PetscFunctionReturn(0); 159e5c89e4eSSatish Balay } 160e5c89e4eSSatish Balay 161e5c89e4eSSatish Balay #undef __FUNCT__ 162e5c89e4eSSatish Balay #define __FUNCT__ "PetscMemzero" 163e30d2299SSatish Balay /*@ 164e5c89e4eSSatish Balay PetscMemzero - Zeros the specified memory. 165e5c89e4eSSatish Balay 166e5c89e4eSSatish Balay Not Collective 167e5c89e4eSSatish Balay 168e5c89e4eSSatish Balay Input Parameters: 169e5c89e4eSSatish Balay + a - pointer to beginning memory location 170e5c89e4eSSatish Balay - n - length (in bytes) of memory to initialize 171e5c89e4eSSatish Balay 172e5c89e4eSSatish Balay Level: intermediate 173e5c89e4eSSatish Balay 174e5c89e4eSSatish Balay Compile Option: 175e5c89e4eSSatish Balay PETSC_PREFER_BZERO - on certain machines (the IBM RS6000) the bzero() routine happens 176e5c89e4eSSatish Balay to be faster than the memset() routine. This flag causes the bzero() routine to be used. 177e5c89e4eSSatish Balay 178e5c89e4eSSatish Balay Concepts: memory^zeroing 179e5c89e4eSSatish Balay Concepts: zeroing^memory 180e5c89e4eSSatish Balay 181e5c89e4eSSatish Balay .seealso: PetscMemcpy() 182e5c89e4eSSatish Balay @*/ 183e5c89e4eSSatish Balay PetscErrorCode PETSC_DLLEXPORT PetscMemzero(void *a,size_t n) 184e5c89e4eSSatish Balay { 185e5c89e4eSSatish Balay PetscFunctionBegin; 186e5c89e4eSSatish Balay if (n > 0) { 187e5c89e4eSSatish Balay if (!a) SETERRQ(PETSC_ERR_ARG_NULL,"Trying to zero at a null pointer"); 188e5c89e4eSSatish Balay #if defined(PETSC_PREFER_ZERO_FOR_MEMZERO) 189e5c89e4eSSatish Balay if (!(((long) a) % sizeof(PetscScalar)) && !(n % sizeof(PetscScalar))) { 190e5c89e4eSSatish Balay size_t i,len = n/sizeof(PetscScalar); 191e5c89e4eSSatish Balay PetscScalar *x = (PetscScalar*)a; 192e5c89e4eSSatish Balay for (i=0; i<len; i++) x[i] = 0.0; 193e5c89e4eSSatish Balay } else { 194e5c89e4eSSatish Balay #elif defined(PETSC_PREFER_FORTRAN_FOR_MEMZERO) 195e5c89e4eSSatish Balay if (!(((long) a) % sizeof(PetscScalar)) && !(n % sizeof(PetscScalar))) { 196e5c89e4eSSatish Balay PetscInt len = n/sizeof(PetscScalar); 197e5c89e4eSSatish Balay fortranzero_(&len,(PetscScalar*)a); 198e5c89e4eSSatish Balay } else { 199e5c89e4eSSatish Balay #endif 200e5c89e4eSSatish Balay #if defined(PETSC_PREFER_BZERO) 201e5c89e4eSSatish Balay bzero((char *)a,n); 2021b54b3b6SSatish Balay #elif defined (PETSC_HAVE__INTEL_FAST_MEMSET) 2031b54b3b6SSatish Balay _intel_fast_memset((char*)a,0,n); 204e5c89e4eSSatish Balay #else 205e5c89e4eSSatish Balay memset((char*)a,0,n); 206e5c89e4eSSatish Balay #endif 207e5c89e4eSSatish Balay #if defined(PETSC_PREFER_ZERO_FOR_MEMZERO) || defined(PETSC_PREFER_FORTRAN_FOR_MEMZERO) 208e5c89e4eSSatish Balay } 209e5c89e4eSSatish Balay #endif 210e5c89e4eSSatish Balay } 211e5c89e4eSSatish Balay PetscFunctionReturn(0); 212e5c89e4eSSatish Balay } 213e5c89e4eSSatish Balay 214e5c89e4eSSatish Balay #undef __FUNCT__ 215e5c89e4eSSatish Balay #define __FUNCT__ "PetscMemcmp" 216e5c89e4eSSatish Balay /*@C 217e5c89e4eSSatish Balay PetscMemcmp - Compares two byte streams in memory. 218e5c89e4eSSatish Balay 219e5c89e4eSSatish Balay Not Collective 220e5c89e4eSSatish Balay 221e5c89e4eSSatish Balay Input Parameters: 222e5c89e4eSSatish Balay + str1 - Pointer to the first byte stream 223e5c89e4eSSatish Balay . str2 - Pointer to the second byte stream 224e5c89e4eSSatish Balay - len - The length of the byte stream 225e5c89e4eSSatish Balay (both str1 and str2 are assumed to be of length len) 226e5c89e4eSSatish Balay 227e5c89e4eSSatish Balay Output Parameters: 228e5c89e4eSSatish Balay . e - PETSC_TRUE if equal else PETSC_FALSE. 229e5c89e4eSSatish Balay 230e5c89e4eSSatish Balay Level: intermediate 231e5c89e4eSSatish Balay 232e5c89e4eSSatish Balay Note: 233e5c89e4eSSatish Balay This routine is anologous to memcmp() 234e5c89e4eSSatish Balay @*/ 235e5c89e4eSSatish Balay PetscErrorCode PETSC_DLLEXPORT PetscMemcmp(const void *str1,const void *str2,size_t len,PetscTruth *e) 236e5c89e4eSSatish Balay { 237e5c89e4eSSatish Balay int r; 238e5c89e4eSSatish Balay 239e5c89e4eSSatish Balay PetscFunctionBegin; 240e5c89e4eSSatish Balay if (len > 0 && !str1) SETERRQ(PETSC_ERR_ARG_NULL,"Trying to compare at a null pointer"); 241e5c89e4eSSatish Balay if (len > 0 && !str2) SETERRQ(PETSC_ERR_ARG_NULL,"Trying to compare at a null pointer"); 242e5c89e4eSSatish Balay r = memcmp((char *)str1,(char *)str2,len); 243e5c89e4eSSatish Balay if (!r) *e = PETSC_TRUE; 244e5c89e4eSSatish Balay else *e = PETSC_FALSE; 245e5c89e4eSSatish Balay PetscFunctionReturn(0); 246e5c89e4eSSatish Balay } 247e5c89e4eSSatish Balay 248e5c89e4eSSatish Balay #undef __FUNCT__ 249e5c89e4eSSatish Balay #define __FUNCT__ "PetscMemmove" 250e5c89e4eSSatish Balay /*@C 251e5c89e4eSSatish Balay PetscMemmove - Copies n bytes, beginning at location b, to the space 252e5c89e4eSSatish Balay beginning at location a. Copying between regions that overlap will 253e5c89e4eSSatish Balay take place correctly. 254e5c89e4eSSatish Balay 255e5c89e4eSSatish Balay Not Collective 256e5c89e4eSSatish Balay 257e5c89e4eSSatish Balay Input Parameters: 258e5c89e4eSSatish Balay + b - pointer to initial memory space 259e5c89e4eSSatish Balay - n - length (in bytes) of space to copy 260e5c89e4eSSatish Balay 261e5c89e4eSSatish Balay Output Parameter: 262e5c89e4eSSatish Balay . a - pointer to copy space 263e5c89e4eSSatish Balay 264e5c89e4eSSatish Balay Level: intermediate 265e5c89e4eSSatish Balay 266e5c89e4eSSatish Balay Note: 267e5c89e4eSSatish Balay This routine is analogous to memmove(). 268e5c89e4eSSatish Balay 269e5c89e4eSSatish Balay Concepts: memory^copying with overlap 270e5c89e4eSSatish Balay Concepts: copying^memory with overlap 271e5c89e4eSSatish Balay 272e5c89e4eSSatish Balay .seealso: PetscMemcpy() 273e5c89e4eSSatish Balay @*/ 274e5c89e4eSSatish Balay PetscErrorCode PETSC_DLLEXPORT PetscMemmove(void *a,void *b,size_t n) 275e5c89e4eSSatish Balay { 276e5c89e4eSSatish Balay PetscFunctionBegin; 277e5c89e4eSSatish Balay if (n > 0 && !a) SETERRQ(PETSC_ERR_ARG_NULL,"Trying to copy to null pointer"); 278e5c89e4eSSatish Balay if (n > 0 && !b) SETERRQ(PETSC_ERR_ARG_NULL,"Trying to copy from a null pointer"); 279e5c89e4eSSatish Balay #if !defined(PETSC_HAVE_MEMMOVE) 280e5c89e4eSSatish Balay if (a < b) { 281e5c89e4eSSatish Balay if (a <= b - n) { 282e5c89e4eSSatish Balay memcpy(a,b,n); 283e5c89e4eSSatish Balay } else { 284e5c89e4eSSatish Balay memcpy(a,b,(int)(b - a)); 285e5c89e4eSSatish Balay PetscMemmove(b,b + (int)(b - a),n - (int)(b - a)); 286e5c89e4eSSatish Balay } 287e5c89e4eSSatish Balay } else { 288e5c89e4eSSatish Balay if (b <= a - n) { 289e5c89e4eSSatish Balay memcpy(a,b,n); 290e5c89e4eSSatish Balay } else { 291e5c89e4eSSatish Balay memcpy(b + n,b + (n - (int)(a - b)),(int)(a - b)); 292e5c89e4eSSatish Balay PetscMemmove(a,b,n - (int)(a - b)); 293e5c89e4eSSatish Balay } 294e5c89e4eSSatish Balay } 295e5c89e4eSSatish Balay #else 296e5c89e4eSSatish Balay memmove((char*)(a),(char*)(b),n); 297e5c89e4eSSatish Balay #endif 298e5c89e4eSSatish Balay PetscFunctionReturn(0); 299e5c89e4eSSatish Balay } 300e5c89e4eSSatish Balay 301e5c89e4eSSatish Balay 302e5c89e4eSSatish Balay 303e5c89e4eSSatish Balay 304