Lines Matching refs:aval

32       vec_vals = _mm512_loadu_pd(aval); \
37 vec_vals = _mm256_loadu_pd(aval); \
325 const MatScalar *aval = a->val; in MatMult_SeqSELL() local
351 #pragma disjoint(*x, *y, *aval) in MatMult_SeqSELL()
361 PetscPrefetchBlock(aval, a->sliidx[i + 1] - a->sliidx[i], 0, PETSC_PREFETCH_HINT_T0); in MatMult_SeqSELL()
373 aval += 8; in MatMult_SeqSELL()
376 aval += 8; in MatMult_SeqSELL()
379 aval += 8; in MatMult_SeqSELL()
385 aval += 8; in MatMult_SeqSELL()
388 aval += 8; in MatMult_SeqSELL()
394 aval += 8; in MatMult_SeqSELL()
402 aval += 8; in MatMult_SeqSELL()
405 aval += 8; in MatMult_SeqSELL()
408 aval += 8; in MatMult_SeqSELL()
411 aval += 8; in MatMult_SeqSELL()
428 PetscPrefetchBlock(aval, a->sliidx[i + 1] - a->sliidx[i], 0, PETSC_PREFETCH_HINT_T0); in MatMult_SeqSELL()
437 for (j = 0; j < nnz_in_row; ++j) yval += aval[8 * j + r] * x[acolidx[8 * j + r]]; in MatMult_SeqSELL()
451 aval += 4; in MatMult_SeqSELL()
454 aval += 4; in MatMult_SeqSELL()
465 PetscPrefetchBlock(aval, a->sliidx[i + 1] - a->sliidx[i], 0, PETSC_PREFETCH_HINT_T0); in MatMult_SeqSELL()
477 for (j = 0; j < nnz_in_row; ++j) yval += aval[8 * j + r] * x[acolidx[8 * j + r]]; in MatMult_SeqSELL()
487 vec_vals = _mm256_loadu_pd(aval); in MatMult_SeqSELL()
496 aval += 4; in MatMult_SeqSELL()
498 vec_vals = _mm256_loadu_pd(aval); in MatMult_SeqSELL()
506 aval += 4; in MatMult_SeqSELL()
517 …for (k = a->sliidx[i] + j; k < a->sliidx[i + 1]; k += sliceheight) sum[j] += aval[k] * x[acolidx[k… in MatMult_SeqSELL()
540 const MatScalar *aval = a->val; in MatMultAdd_SeqSELL() local
561 #pragma disjoint(*x, *y, *aval) in MatMultAdd_SeqSELL()
575 PetscPrefetchBlock(aval, a->sliidx[i + 1] - a->sliidx[i], 0, PETSC_PREFETCH_HINT_T0); in MatMultAdd_SeqSELL()
592 aval += 8; in MatMultAdd_SeqSELL()
595 aval += 8; in MatMultAdd_SeqSELL()
598 aval += 8; in MatMultAdd_SeqSELL()
604 aval += 8; in MatMultAdd_SeqSELL()
607 aval += 8; in MatMultAdd_SeqSELL()
613 aval += 8; in MatMultAdd_SeqSELL()
621 aval += 8; in MatMultAdd_SeqSELL()
624 aval += 8; in MatMultAdd_SeqSELL()
627 aval += 8; in MatMultAdd_SeqSELL()
630 aval += 8; in MatMultAdd_SeqSELL()
646 PetscPrefetchBlock(aval, a->sliidx[i + 1] - a->sliidx[i], 0, PETSC_PREFETCH_HINT_T0); in MatMultAdd_SeqSELL()
654 for (j = 0; j < nnz_in_row; ++j) yval += aval[8 * j + r] * x[acolidx[8 * j + r]]; in MatMultAdd_SeqSELL()
665 vec_vals = _mm256_loadu_pd(aval); in MatMultAdd_SeqSELL()
675 aval += 4; in MatMultAdd_SeqSELL()
677 vec_vals = _mm256_loadu_pd(aval); in MatMultAdd_SeqSELL()
685 aval += 4; in MatMultAdd_SeqSELL()
696 …for (k = a->sliidx[i] + j; k < a->sliidx[i + 1]; k += sliceheight) sum[j] += aval[k] * x[acolidx[k… in MatMultAdd_SeqSELL()
718 const MatScalar *aval = a->val; in MatMultTransposeAdd_SeqSELL() local
723 #pragma disjoint(*x, *y, *aval) in MatMultTransposeAdd_SeqSELL()
741 …for (j = 0; j < nnz_in_row; ++j) y[acolidx[sliceheight * j + r]] += aval[sliceheight * j + r] * x[… in MatMultTransposeAdd_SeqSELL()
746 …for (j = a->sliidx[i] + r; j < a->sliidx[i + 1]; j += sliceheight) y[acolidx[j]] += aval[j] * x[sl… in MatMultTransposeAdd_SeqSELL()
1663 MatScalar *aval = a->val; in MatScale_SeqSELL() local
1669 PetscCallBLAS("BLASscal", BLASscal_(&size, &oalpha, aval, &one)); in MatScale_SeqSELL()