Lines Matching refs:h_b
531 float *h_a, *h_b, *h_c; in runStream() local
538 if ((h_b = (float *)calloc(N, sizeof(float))) == (float *)NULL) { in runStream()
587 PetscCallCUDA(cudaMemcpy(h_b, d_b, sizeof(float) * N, cudaMemcpyDeviceToHost)); in runStream()
589 errorSTREAMkernel = STREAM_Scale_verify(h_b, h_c, scalar, N); in runStream()
602 PetscCallCUDA(cudaMemcpy(h_b, d_b, sizeof(float) * N, cudaMemcpyDeviceToHost)); in runStream()
604 errorSTREAMkernel = STREAM_Add_verify(h_a, h_b, h_c, N); in runStream()
617 PetscCallCUDA(cudaMemcpy(h_b, d_b, sizeof(float) * N, cudaMemcpyDeviceToHost)); in runStream()
619 errorSTREAMkernel = STREAM_Triad_verify(h_b, h_c, h_a, scalar, N); in runStream()
626 free(h_b); in runStream()
745 double *h_a, *h_b, *h_c; in runStreamDouble() local
752 if ((h_b = (double *)calloc(N, sizeof(double))) == (double *)NULL) { in runStreamDouble()
800 PetscCallCUDA(cudaMemcpy(h_b, d_b, sizeof(double) * N, cudaMemcpyDeviceToHost)); in runStreamDouble()
802 errorSTREAMkernel = STREAM_Scale_verify_double(h_b, h_c, scalar, N); in runStreamDouble()
815 PetscCallCUDA(cudaMemcpy(h_b, d_b, sizeof(double) * N, cudaMemcpyDeviceToHost)); in runStreamDouble()
817 errorSTREAMkernel = STREAM_Add_verify_double(h_a, h_b, h_c, N); in runStreamDouble()
830 PetscCallCUDA(cudaMemcpy(h_b, d_b, sizeof(double) * N, cudaMemcpyDeviceToHost)); in runStreamDouble()
832 errorSTREAMkernel = STREAM_Triad_verify_double(h_b, h_c, h_a, scalar, N); in runStreamDouble()
839 free(h_b); in runStreamDouble()