Searched refs:vec_vals (Results 1 – 3 of 3) sorted by relevance
| /petsc/src/mat/impls/aij/seq/aijperm/ |
| H A D | aijperm.c | 285 __m512d vec_x, vec_y, vec_vals; in MatMult_SeqAIJPERM() local 382 vec_vals = _mm512_loadu_pd(&aa[ipos]); in MatMult_SeqAIJPERM() 384 vec_y = _mm512_fmadd_pd(vec_x, vec_vals, vec_y); in MatMult_SeqAIJPERM() 390 vec_vals = _mm512_loadu_pd(&aa[ipos]); in MatMult_SeqAIJPERM() 392 vec_y = _mm512_mask3_fmadd_pd(vec_x, vec_vals, vec_y, mask); in MatMult_SeqAIJPERM() 419 vec_vals = _mm512_i32gather_pd(vec_ipos, aa, _MM_SCALE_8); in MatMult_SeqAIJPERM() 421 vec_y = _mm512_fmadd_pd(vec_x, vec_vals, vec_y); in MatMult_SeqAIJPERM()
|
| /petsc/src/mat/impls/sell/seq/ |
| H A D | sell.c | 29 #define AVX512_Mult_Private(vec_idx, vec_x, vec_vals, vec_y) \ argument 32 vec_vals = _mm512_loadu_pd(aval); \ 34 vec_y = _mm512_fmadd_pd(vec_x, vec_vals, vec_y) 36 #define AVX2_Mult_Private(vec_idx, vec_x, vec_vals, vec_y) \ argument 37 vec_vals = _mm256_loadu_pd(aval); \ 40 vec_y = _mm256_fmadd_pd(vec_x, vec_vals, vec_y) 330 __m512d vec_x, vec_y, vec_vals; in MatMult_SeqSELL() local 337 __m256d vec_x, vec_y, vec_y2, vec_vals; in MatMult_SeqSELL() local 342 __m256d vec_x, vec_y, vec_y2, vec_vals; in MatMult_SeqSELL() local 371 AVX512_Mult_Private(vec_idx, vec_x, vec_vals, vec_y); in MatMult_SeqSELL() [all …]
|
| /petsc/src/mat/impls/aij/seq/ |
| H A D | aij.h | 626 __m512d vec_x, vec_y, vec_vals; in PetscSparseDensePlusDot_AVX512_Private() local 633 vec_vals = _mm512_loadu_pd(aa); in PetscSparseDensePlusDot_AVX512_Private() 635 vec_y = _mm512_fmadd_pd(vec_x, vec_vals, vec_y); in PetscSparseDensePlusDot_AVX512_Private() 645 vec_vals = _mm512_mask_loadu_pd(vec_vals, mask, aa); in PetscSparseDensePlusDot_AVX512_Private() 647 vec_y = _mm512_mask3_fmadd_pd(vec_x, vec_vals, vec_y, mask); in PetscSparseDensePlusDot_AVX512_Private()
|