Lines Matching refs:B0
707 …__m256d S0, S1, S2, S3, S4, S5, S6, S7, S8, B0, B1, B2, B6, B7, B8, A0, A1, A2, A3, A4, A5, A6, A… in PetscKernel_A_gets_A_times_B_9() local
724 B0 = _mm256_broadcast_sd(B + 0); in PetscKernel_A_gets_A_times_B_9()
727 S0 = _mm256_fmadd_pd(A0, B0, S0); in PetscKernel_A_gets_A_times_B_9()
728 S1 = _mm256_fmadd_pd(A1, B0, S1); in PetscKernel_A_gets_A_times_B_9()
729 S2 = _mm256_fmadd_pd(A2, B0, S2); in PetscKernel_A_gets_A_times_B_9()
756 B0 = _mm256_broadcast_sd(B + 2); in PetscKernel_A_gets_A_times_B_9()
759 S0 = _mm256_fmadd_pd(A6, B0, S0); in PetscKernel_A_gets_A_times_B_9()
760 S1 = _mm256_fmadd_pd(A7, B0, S1); in PetscKernel_A_gets_A_times_B_9()
761 S2 = _mm256_fmadd_pd(A8, B0, S2); in PetscKernel_A_gets_A_times_B_9()
788 B0 = _mm256_broadcast_sd(B + 4); in PetscKernel_A_gets_A_times_B_9()
791 S0 = _mm256_fmadd_pd(A3, B0, S0); in PetscKernel_A_gets_A_times_B_9()
792 S1 = _mm256_fmadd_pd(A4, B0, S1); in PetscKernel_A_gets_A_times_B_9()
793 S2 = _mm256_fmadd_pd(A5, B0, S2); in PetscKernel_A_gets_A_times_B_9()
820 B0 = _mm256_broadcast_sd(B + 6); in PetscKernel_A_gets_A_times_B_9()
823 S0 = _mm256_fmadd_pd(A3, B0, S0); in PetscKernel_A_gets_A_times_B_9()
824 S1 = _mm256_fmadd_pd(A4, B0, S1); in PetscKernel_A_gets_A_times_B_9()
825 S2 = _mm256_fmadd_pd(A5, B0, S2); in PetscKernel_A_gets_A_times_B_9()
852 B0 = _mm256_broadcast_sd(B + 8); in PetscKernel_A_gets_A_times_B_9()
855 S0 = _mm256_fmadd_pd(A0, B0, S0); in PetscKernel_A_gets_A_times_B_9()
856 S1 = _mm256_fmadd_pd(A1, B0, S1); in PetscKernel_A_gets_A_times_B_9()
857 S2 = _mm256_fmadd_pd(A2, B0, S2); in PetscKernel_A_gets_A_times_B_9()
980 …__m256d A0, A1, A2, A3, A4, A5, A6, A7, A8, B0, B1, B2, B3, B4, B5, B6, B7, B8, C0, C1, C2, C3, C… in PetscKernel_A_gets_A_minus_B_times_C_9() local
993 B0 = _mm256_loadu_pd(B + 0); in PetscKernel_A_gets_A_minus_B_times_C_9()
999 A0 = _mm256_fnmadd_pd(B0, C0, A0); in PetscKernel_A_gets_A_minus_B_times_C_9()
1002 A3 = _mm256_fnmadd_pd(B0, C1, A3); in PetscKernel_A_gets_A_minus_B_times_C_9()
1005 A6 = _mm256_fnmadd_pd(B0, C2, A6); in PetscKernel_A_gets_A_minus_B_times_C_9()
1041 B0 = _mm256_loadu_pd(B + 27); in PetscKernel_A_gets_A_minus_B_times_C_9()
1047 A0 = _mm256_fnmadd_pd(B0, C0, A0); in PetscKernel_A_gets_A_minus_B_times_C_9()
1050 A3 = _mm256_fnmadd_pd(B0, C1, A3); in PetscKernel_A_gets_A_minus_B_times_C_9()
1053 A6 = _mm256_fnmadd_pd(B0, C2, A6); in PetscKernel_A_gets_A_minus_B_times_C_9()
1089 B0 = _mm256_loadu_pd(B + 54); in PetscKernel_A_gets_A_minus_B_times_C_9()
1095 A0 = _mm256_fnmadd_pd(B0, C0, A0); in PetscKernel_A_gets_A_minus_B_times_C_9()
1098 A3 = _mm256_fnmadd_pd(B0, C1, A3); in PetscKernel_A_gets_A_minus_B_times_C_9()
1101 A6 = _mm256_fnmadd_pd(B0, C2, A6); in PetscKernel_A_gets_A_minus_B_times_C_9()