Lines Matching refs:A1

707 …__m256d  S0, S1, S2, S3, S4, S5, S6, S7, S8, B0, B1, B2, B6, B7, B8, A0, A1, A2, A3, A4, A5, A6, A…  in PetscKernel_A_gets_A_times_B_9()  local
722 A1 = _mm256_loadu_pd(W + 4); in PetscKernel_A_gets_A_times_B_9()
728 S1 = _mm256_fmadd_pd(A1, B0, S1); in PetscKernel_A_gets_A_times_B_9()
731 S4 = _mm256_fmadd_pd(A1, B1, S4); in PetscKernel_A_gets_A_times_B_9()
734 S7 = _mm256_fmadd_pd(A1, B2, S7); in PetscKernel_A_gets_A_times_B_9()
770 A1 = _mm256_loadu_pd(W + 31); in PetscKernel_A_gets_A_times_B_9()
776 S1 = _mm256_fmadd_pd(A1, B6, S1); in PetscKernel_A_gets_A_times_B_9()
779 S4 = _mm256_fmadd_pd(A1, B7, S4); in PetscKernel_A_gets_A_times_B_9()
782 S7 = _mm256_fmadd_pd(A1, B8, S7); in PetscKernel_A_gets_A_times_B_9()
802 A1 = _mm256_loadu_pd(W + 49); in PetscKernel_A_gets_A_times_B_9()
808 S1 = _mm256_fmadd_pd(A1, B6, S1); in PetscKernel_A_gets_A_times_B_9()
811 S4 = _mm256_fmadd_pd(A1, B7, S4); in PetscKernel_A_gets_A_times_B_9()
814 S7 = _mm256_fmadd_pd(A1, B8, S7); in PetscKernel_A_gets_A_times_B_9()
850 A1 = _mm256_loadu_pd(W + 76); in PetscKernel_A_gets_A_times_B_9()
856 S1 = _mm256_fmadd_pd(A1, B0, S1); in PetscKernel_A_gets_A_times_B_9()
859 S4 = _mm256_fmadd_pd(A1, B1, S4); in PetscKernel_A_gets_A_times_B_9()
862 S7 = _mm256_fmadd_pd(A1, B2, S7); in PetscKernel_A_gets_A_times_B_9()
980 …__m256d A0, A1, A2, A3, A4, A5, A6, A7, A8, B0, B1, B2, B3, B4, B5, B6, B7, B8, C0, C1, C2, C3, C… in PetscKernel_A_gets_A_minus_B_times_C_9() local
984 A1 = _mm256_loadu_pd(A + 4); in PetscKernel_A_gets_A_minus_B_times_C_9()
1000 A1 = _mm256_fnmadd_pd(B1, C0, A1); in PetscKernel_A_gets_A_minus_B_times_C_9()
1016 A1 = _mm256_fnmadd_pd(B4, C3, A1); in PetscKernel_A_gets_A_minus_B_times_C_9()
1032 A1 = _mm256_fnmadd_pd(B7, C6, A1); in PetscKernel_A_gets_A_minus_B_times_C_9()
1048 A1 = _mm256_fnmadd_pd(B1, C0, A1); in PetscKernel_A_gets_A_minus_B_times_C_9()
1064 A1 = _mm256_fnmadd_pd(B4, C3, A1); in PetscKernel_A_gets_A_minus_B_times_C_9()
1080 A1 = _mm256_fnmadd_pd(B7, C6, A1); in PetscKernel_A_gets_A_minus_B_times_C_9()
1096 A1 = _mm256_fnmadd_pd(B1, C0, A1); in PetscKernel_A_gets_A_minus_B_times_C_9()
1112 A1 = _mm256_fnmadd_pd(B4, C3, A1); in PetscKernel_A_gets_A_minus_B_times_C_9()
1128 A1 = _mm256_fnmadd_pd(B7, C6, A1); in PetscKernel_A_gets_A_minus_B_times_C_9()
1138 _mm256_storeu_pd(&A[4], A1); in PetscKernel_A_gets_A_minus_B_times_C_9()