Lines Matching refs:A2

707 …__m256d  S0, S1, S2, S3, S4, S5, S6, S7, S8, B0, B1, B2, B6, B7, B8, A0, A1, A2, A3, A4, A5, A6, A…  in PetscKernel_A_gets_A_times_B_9()  local
723 A2 = _mm256_loadu_pd(W + 8); in PetscKernel_A_gets_A_times_B_9()
729 S2 = _mm256_fmadd_pd(A2, B0, S2); in PetscKernel_A_gets_A_times_B_9()
732 S5 = _mm256_fmadd_pd(A2, B1, S5); in PetscKernel_A_gets_A_times_B_9()
735 S8 = _mm256_fmadd_pd(A2, B2, S8); in PetscKernel_A_gets_A_times_B_9()
771 A2 = _mm256_loadu_pd(W + 35); in PetscKernel_A_gets_A_times_B_9()
777 S2 = _mm256_fmadd_pd(A2, B6, S2); in PetscKernel_A_gets_A_times_B_9()
780 S5 = _mm256_fmadd_pd(A2, B7, S5); in PetscKernel_A_gets_A_times_B_9()
783 S8 = _mm256_fmadd_pd(A2, B8, S8); in PetscKernel_A_gets_A_times_B_9()
803 A2 = _mm256_loadu_pd(W + 53); in PetscKernel_A_gets_A_times_B_9()
809 S2 = _mm256_fmadd_pd(A2, B6, S2); in PetscKernel_A_gets_A_times_B_9()
812 S5 = _mm256_fmadd_pd(A2, B7, S5); in PetscKernel_A_gets_A_times_B_9()
815 S8 = _mm256_fmadd_pd(A2, B8, S8); in PetscKernel_A_gets_A_times_B_9()
851 A2 = _mm256_broadcast_sd(W + 80); in PetscKernel_A_gets_A_times_B_9()
857 S2 = _mm256_fmadd_pd(A2, B0, S2); in PetscKernel_A_gets_A_times_B_9()
860 S5 = _mm256_fmadd_pd(A2, B1, S5); in PetscKernel_A_gets_A_times_B_9()
863 S8 = _mm256_fmadd_pd(A2, B2, S8); in PetscKernel_A_gets_A_times_B_9()
980 …__m256d A0, A1, A2, A3, A4, A5, A6, A7, A8, B0, B1, B2, B3, B4, B5, B6, B7, B8, C0, C1, C2, C3, C… in PetscKernel_A_gets_A_minus_B_times_C_9() local
985 A2 = _mm256_loadu_pd(A + 8); in PetscKernel_A_gets_A_minus_B_times_C_9()
1001 A2 = _mm256_fnmadd_pd(B2, C0, A2); in PetscKernel_A_gets_A_minus_B_times_C_9()
1017 A2 = _mm256_fnmadd_pd(B5, C3, A2); in PetscKernel_A_gets_A_minus_B_times_C_9()
1033 A2 = _mm256_fnmadd_pd(B8, C6, A2); in PetscKernel_A_gets_A_minus_B_times_C_9()
1049 A2 = _mm256_fnmadd_pd(B2, C0, A2); in PetscKernel_A_gets_A_minus_B_times_C_9()
1065 A2 = _mm256_fnmadd_pd(B5, C3, A2); in PetscKernel_A_gets_A_minus_B_times_C_9()
1081 A2 = _mm256_fnmadd_pd(B8, C6, A2); in PetscKernel_A_gets_A_minus_B_times_C_9()
1097 A2 = _mm256_fnmadd_pd(B2, C0, A2); in PetscKernel_A_gets_A_minus_B_times_C_9()
1113 A2 = _mm256_fnmadd_pd(B5, C3, A2); in PetscKernel_A_gets_A_minus_B_times_C_9()
1129 A2 = _mm256_fnmadd_pd(B8, C6, A2); in PetscKernel_A_gets_A_minus_B_times_C_9()
1139 _mm256_maskstore_pd(&A[8], _mm256_set_epi64x(0LL, 0LL, 0LL, 1LL << 63), A2); in PetscKernel_A_gets_A_minus_B_times_C_9()