Lines Matching refs:B1
707 …__m256d S0, S1, S2, S3, S4, S5, S6, S7, S8, B0, B1, B2, B6, B7, B8, A0, A1, A2, A3, A4, A5, A6, A… in PetscKernel_A_gets_A_times_B_9() local
725 B1 = _mm256_broadcast_sd(B + 9); in PetscKernel_A_gets_A_times_B_9()
730 S3 = _mm256_fmadd_pd(A0, B1, S3); in PetscKernel_A_gets_A_times_B_9()
731 S4 = _mm256_fmadd_pd(A1, B1, S4); in PetscKernel_A_gets_A_times_B_9()
732 S5 = _mm256_fmadd_pd(A2, B1, S5); in PetscKernel_A_gets_A_times_B_9()
757 B1 = _mm256_broadcast_sd(B + 11); in PetscKernel_A_gets_A_times_B_9()
762 S3 = _mm256_fmadd_pd(A6, B1, S3); in PetscKernel_A_gets_A_times_B_9()
763 S4 = _mm256_fmadd_pd(A7, B1, S4); in PetscKernel_A_gets_A_times_B_9()
764 S5 = _mm256_fmadd_pd(A8, B1, S5); in PetscKernel_A_gets_A_times_B_9()
789 B1 = _mm256_broadcast_sd(B + 13); in PetscKernel_A_gets_A_times_B_9()
794 S3 = _mm256_fmadd_pd(A3, B1, S3); in PetscKernel_A_gets_A_times_B_9()
795 S4 = _mm256_fmadd_pd(A4, B1, S4); in PetscKernel_A_gets_A_times_B_9()
796 S5 = _mm256_fmadd_pd(A5, B1, S5); in PetscKernel_A_gets_A_times_B_9()
821 B1 = _mm256_broadcast_sd(B + 15); in PetscKernel_A_gets_A_times_B_9()
826 S3 = _mm256_fmadd_pd(A3, B1, S3); in PetscKernel_A_gets_A_times_B_9()
827 S4 = _mm256_fmadd_pd(A4, B1, S4); in PetscKernel_A_gets_A_times_B_9()
828 S5 = _mm256_fmadd_pd(A5, B1, S5); in PetscKernel_A_gets_A_times_B_9()
853 B1 = _mm256_broadcast_sd(B + 17); in PetscKernel_A_gets_A_times_B_9()
858 S3 = _mm256_fmadd_pd(A0, B1, S3); in PetscKernel_A_gets_A_times_B_9()
859 S4 = _mm256_fmadd_pd(A1, B1, S4); in PetscKernel_A_gets_A_times_B_9()
860 S5 = _mm256_fmadd_pd(A2, B1, S5); in PetscKernel_A_gets_A_times_B_9()
980 …__m256d A0, A1, A2, A3, A4, A5, A6, A7, A8, B0, B1, B2, B3, B4, B5, B6, B7, B8, C0, C1, C2, C3, C… in PetscKernel_A_gets_A_minus_B_times_C_9() local
994 B1 = _mm256_loadu_pd(B + 4); in PetscKernel_A_gets_A_minus_B_times_C_9()
1000 A1 = _mm256_fnmadd_pd(B1, C0, A1); in PetscKernel_A_gets_A_minus_B_times_C_9()
1003 A4 = _mm256_fnmadd_pd(B1, C1, A4); in PetscKernel_A_gets_A_minus_B_times_C_9()
1006 A7 = _mm256_fnmadd_pd(B1, C2, A7); in PetscKernel_A_gets_A_minus_B_times_C_9()
1042 B1 = _mm256_loadu_pd(B + 31); in PetscKernel_A_gets_A_minus_B_times_C_9()
1048 A1 = _mm256_fnmadd_pd(B1, C0, A1); in PetscKernel_A_gets_A_minus_B_times_C_9()
1051 A4 = _mm256_fnmadd_pd(B1, C1, A4); in PetscKernel_A_gets_A_minus_B_times_C_9()
1054 A7 = _mm256_fnmadd_pd(B1, C2, A7); in PetscKernel_A_gets_A_minus_B_times_C_9()
1090 B1 = _mm256_loadu_pd(B + 58); in PetscKernel_A_gets_A_minus_B_times_C_9()
1096 A1 = _mm256_fnmadd_pd(B1, C0, A1); in PetscKernel_A_gets_A_minus_B_times_C_9()
1099 A4 = _mm256_fnmadd_pd(B1, C1, A4); in PetscKernel_A_gets_A_minus_B_times_C_9()
1102 A7 = _mm256_fnmadd_pd(B1, C2, A7); in PetscKernel_A_gets_A_minus_B_times_C_9()