#ifdef PETSC_RCS_HEADER static char vcid[] = "$Id: Index.c,v 1.22 1999/05/04 20:38:02 balay Exp balay $"; #endif #include "petsc.h" #include "sys.h" extern int BlastCache(void); extern int test1(void); extern int test2(void); #undef __FUNC__ #define __FUNC__ "main" int main( int argc, char **argv) { int ierr; PetscInitialize(&argc, &argv,0,0); ierr = test1();CHKERRA(ierr); ierr = test2();CHKERRA(ierr); PetscFinalize(); PetscFunctionReturn(0); } #undef __FUNC__ #define __FUNC__ "test1" int test1(void) { PLogDouble t1, t2; double value; int i, ierr,*z,*zi, intval; Scalar *x, *y; PetscRandom r; ierr = PetscRandomCreate(PETSC_COMM_SELF,RANDOM_DEFAULT,&r);CHKERRQ(ierr); x = (Scalar *)PetscMalloc(20000*sizeof(Scalar));CHKPTRA(x); y = (Scalar *)PetscMalloc(20000*sizeof(Scalar));CHKPTRA(y); z = (int *)PetscMalloc(2000*sizeof(int));CHKPTRA(z); zi = (int *)PetscMalloc(2000*sizeof(int));CHKPTRA(zi); /* Take care of paging effects */ ierr = PetscGetTime(&t1);CHKERRQ(ierr); /* Form the random set of integers */ for (i=0; i<2000; i++) { ierr = PetscRandomGetValue(r, &value);CHKERRQ(ierr); intval = (int)(value*20000.0); z[i] = intval; } for (i=0; i<2000; i++) { ierr = PetscRandomGetValue(r, &value);CHKERRQ(ierr); intval = (int)(value*20000.0); zi[i] = intval; } fprintf(stderr,"Done setup\n"); ierr = BlastCache();CHKERRQ(ierr); ierr = PetscGetTime(&t1);CHKERRQ(ierr); for (i=0; i<2000; i++) { x[i] = y[i]; } ierr = PetscGetTime(&t2);CHKERRQ(ierr); fprintf(stderr,"%-19s : %e sec\n","x[i] = y[i]",(t2-t1)/2000.0); ierr = BlastCache();CHKERRQ(ierr); ierr = PetscGetTime(&t1);CHKERRQ(ierr); for (i=0; i<500; i+=4) { x[i] = y[z[i]]; x[1+i] = y[z[1+i]]; x[2+i] = y[z[2+i]]; x[3+i] = y[z[3+i]]; } ierr = PetscGetTime(&t2);CHKERRQ(ierr); fprintf(stderr,"%-19s : %e sec\n","x[i] = y[idx[i]] - unroll 4",(t2-t1)/2000.0); ierr = BlastCache();CHKERRQ(ierr); ierr = PetscGetTime(&t1);CHKERRQ(ierr) for (i=0; i<2000; i++) { x[i] = y[z[i]]; } ierr = PetscGetTime(&t2);CHKERRQ(ierr); fprintf(stderr,"%-19s : %e sec\n","x[i] = y[idx[i]]",(t2-t1)/2000.0); ierr = BlastCache();CHKERRQ(ierr); ierr = PetscGetTime(&t1);CHKERRQ(ierr); for (i=0; i<1000; i+=2) { x[i] = y[z[i]]; x[1+i] = y[z[1+i]]; } ierr = PetscGetTime(&t2);CHKERRQ(ierr); fprintf(stderr,"%-19s : %e sec\n","x[i] = y[idx[i]] - unroll 2",(t2-t1)/2000.0); ierr = BlastCache();CHKERRQ(ierr); ierr = PetscGetTime(&t1);CHKERRQ(ierr); for (i=0; i<2000; i++) { x[z[i]] = y[i]; } ierr = PetscGetTime(&t2);CHKERRQ(ierr); fprintf(stderr,"%-19s : %e sec\n","x[z[i]] = y[i]",(t2-t1)/2000.0); ierr = BlastCache();CHKERRQ(ierr); ierr = PetscGetTime(&t1);CHKERRQ(ierr); for (i=0; i<2000; i++) { x[z[i]] = y[zi[i]]; } ierr = PetscGetTime(&t2);CHKERRQ(ierr); fprintf(stderr,"%-19s : %e sec\n","x[z[i]] = y[zi[i]]",(t2-t1)/2000.0); ierr = PetscMemcpy(x,y,10);CHKERRQ(ierr); ierr = PetscMemcpy(z,zi,10);CHKERRQ(ierr); ierr = PetscFree(z);CHKERRQ(ierr); ierr = PetscFree(zi);CHKERRQ(ierr); ierr = PetscFree(x);CHKERRQ(ierr); ierr = PetscFree(y);CHKERRQ(ierr); PetscRandomDestroy(r); PetscFunctionReturn(0); } #undef __FUNC__ #define __FUNC__ "test2" int test2(void) { PLogDouble t1, t2; double value; int i, ierr,z[20000],zi[20000], intval, tmp; Scalar x[20000], y[20000]; PetscRandom r; ierr = PetscRandomCreate(PETSC_COMM_SELF,RANDOM_DEFAULT,&r);CHKERRQ(ierr); /* Take care of paging effects */ ierr = PetscGetTime(&t1);CHKERRQ(ierr); for (i=0; i<20000; i++) { x[i] = i; y[i] = i; z[i] = i; zi[i] = i; } /* Form the random set of integers */ for (i=0; i<20000; i++) { ierr = PetscRandomGetValue(r, &value);CHKERRQ(ierr); intval = (int)(value*20000.0); tmp = z[i]; z[i] = z[intval]; z[intval] = tmp; } for (i=0; i<20000; i++) { ierr = PetscRandomGetValue(r, &value);CHKERRQ(ierr); intval = (int)(value*20000.0); tmp = zi[i]; zi[i] = zi[intval]; zi[intval] = tmp; } fprintf(stderr,"Done setup\n"); /* ierr = BlastCache();CHKERRQ(ierr); */ ierr = PetscGetTime(&t1);CHKERRQ(ierr); for (i=0; i<2000; i++) { x[i] = y[i]; } ierr = PetscGetTime(&t2);CHKERRQ(ierr); fprintf(stderr,"%-19s : %e sec\n","x[i] = y[i]",(t2-t1)/2000.0); /* ierr = BlastCache();CHKERRQ(ierr); */ ierr = PetscGetTime(&t1);CHKERRQ(ierr); for (i=0; i<2000; i++) { y[i] = x[z[i]]; } ierr = PetscGetTime(&t2);CHKERRQ(ierr); fprintf(stderr,"%-19s : %e sec\n","x[i] = y[idx[i]]",(t2-t1)/2000.0); /* ierr = BlastCache();CHKERRQ(ierr); */ ierr = PetscGetTime(&t1);CHKERRQ(ierr); for (i=0; i<2000; i++) { x[z[i]] = y[i]; } ierr = PetscGetTime(&t2);CHKERRQ(ierr); fprintf(stderr,"%-19s : %e sec\n","x[z[i]] = y[i]",(t2-t1)/2000.0); /* ierr = BlastCache();CHKERRQ(ierr); */ ierr = PetscGetTime(&t1);CHKERRQ(ierr); for (i=0; i<2000; i++) { y[z[i]] = x[zi[i]]; } ierr = PetscGetTime(&t2);CHKERRQ(ierr); fprintf(stderr,"%-19s : %e sec\n","x[z[i]] = y[zi[i]]",(t2-t1)/2000.0); PetscRandomDestroy(r); PetscFunctionReturn(0); } #undef __FUNC__ #define __FUNC__ "BlastCache" int BlastCache(void) { int i,n = 1000000; Scalar *x,*y,*z,*a, *b; x = (Scalar *) PetscMalloc(5*n*sizeof(Scalar));CHKPTRA(x); y = x + n; z = y + n; a = z + n; b = a + n; for ( i=0; i