| /petsc/src/mat/impls/sell/seq/seqcuda/ |
| H A D | sellcuda.cu | 75 …nt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const PetscInt *sl… in matmult_seqsell_basic_kernel() argument 85 …ice_id] + row_in_slice; i < sliidx[slice_id + 1]; i += sliceheight) sum += aval[i] * x[acolidx[i]]; in matmult_seqsell_basic_kernel() 90 …nt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const PetscInt *sl… in matmultadd_seqsell_basic_kernel() argument 100 …ice_id] + row_in_slice; i < sliidx[slice_id + 1]; i += sliceheight) sum += aval[i] * x[acolidx[i]]; in matmultadd_seqsell_basic_kernel() 108 …nt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const PetscInt *sl… in matmult_seqsell_tiled_kernel9() argument 120 …Idx.x + 32 * threadIdx.y; i < sliidx[slice_id + 1]; i += 32 * BLOCKY) t += aval[i] * x[acolidx[i]]; in matmult_seqsell_tiled_kernel9() 137 …nt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const PetscInt *sl… in matmultadd_seqsell_tiled_kernel9() argument 149 …Idx.x + 32 * threadIdx.y; i < sliidx[slice_id + 1]; i += 32 * BLOCKY) t += aval[i] * x[acolidx[i]]; in matmultadd_seqsell_tiled_kernel9() 185 …onst PetscInt *chunk_slice_map, const PetscInt *acolidx, const MatScalar *aval, const PetscInt *sl… in matmult_seqsell_tiled_kernel8() argument 209 if (row < nrows && gid < totalentries) t = aval[gid] * x[acolidx[gid]]; in matmult_seqsell_tiled_kernel8() [all …]
|
| /petsc/src/mat/impls/sell/seq/seqhip/ |
| H A D | sellhip.hip.cxx | 78 …nt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const PetscInt *sl… in matmult_seqsell_basic_kernel() argument 88 …ice_id] + row_in_slice; i < sliidx[slice_id + 1]; i += sliceheight) sum += aval[i] * x[acolidx[i]]; in matmult_seqsell_basic_kernel() 93 …nt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const PetscInt *sl… in matmultadd_seqsell_basic_kernel() argument 103 …ice_id] + row_in_slice; i < sliidx[slice_id + 1]; i += sliceheight) sum += aval[i] * x[acolidx[i]]; in matmultadd_seqsell_basic_kernel() 112 …nt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const PetscInt *sl… in matmult_seqsell_tiled_kernel9() argument 124 …IZE * threadIdx.y; i < sliidx[slice_id + 1]; i += WARP_SIZE * BLOCKY) t += aval[i] * x[acolidx[i]]; in matmult_seqsell_tiled_kernel9() 141 …nt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const PetscInt *sl… in matmultadd_seqsell_tiled_kernel9() argument 153 …IZE * threadIdx.y; i < sliidx[slice_id + 1]; i += WARP_SIZE * BLOCKY) t += aval[i] * x[acolidx[i]]; in matmultadd_seqsell_tiled_kernel9() 189 …onst PetscInt *chunk_slice_map, const PetscInt *acolidx, const MatScalar *aval, const PetscInt *sl… in matmult_seqsell_tiled_kernel8() argument 213 if (row < nrows && gid < totalentries) t = aval[gid] * x[acolidx[gid]]; in matmult_seqsell_tiled_kernel8() [all …]
|
| /petsc/src/mat/impls/sell/seq/ |
| H A D | sell.c | 32 vec_vals = _mm512_loadu_pd(aval); \ 37 vec_vals = _mm256_loadu_pd(aval); \ 325 const MatScalar *aval = a->val; in MatMult_SeqSELL() local 351 #pragma disjoint(*x, *y, *aval) in MatMult_SeqSELL() 361 PetscPrefetchBlock(aval, a->sliidx[i + 1] - a->sliidx[i], 0, PETSC_PREFETCH_HINT_T0); in MatMult_SeqSELL() 373 aval += 8; in MatMult_SeqSELL() 376 aval += 8; in MatMult_SeqSELL() 379 aval += 8; in MatMult_SeqSELL() 385 aval += 8; in MatMult_SeqSELL() 388 aval += 8; in MatMult_SeqSELL() [all …]
|
| /petsc/src/mat/impls/kaij/ |
| H A D | kaij.c | 739 PetscScalar *diag, aval, *v_work; in MatInvertBlockDiagonal_SeqKAIJ() local 764 aval = 0; in MatInvertBlockDiagonal_SeqKAIJ() 766 if (idx[j] == i) aval = v[j]; in MatInvertBlockDiagonal_SeqKAIJ() 767 for (j = 0; j < dof; j++) diag[j + dof * j] += aval; in MatInvertBlockDiagonal_SeqKAIJ() 769 aval = 0; in MatInvertBlockDiagonal_SeqKAIJ() 771 if (idx[j] == i) aval = v[j]; in MatInvertBlockDiagonal_SeqKAIJ() 772 for (j = 0; j < dof2; j++) diag[j] += aval * T[j]; in MatInvertBlockDiagonal_SeqKAIJ()
|
| /petsc/src/mat/impls/sell/mpi/ |
| H A D | mpisell.c | 604 MatScalar *aval; in MatView_MPISELL_ASCIIorDraworSocket() local 621 aval = Aloc->val; in MatView_MPISELL_ASCIIorDraworSocket() 628 PetscCall(MatSetValues(A, 1, &row, 1, &col, aval, INSERT_VALUES)); in MatView_MPISELL_ASCIIorDraworSocket() 630 aval++; in MatView_MPISELL_ASCIIorDraworSocket() 638 aval = Aloc->val; in MatView_MPISELL_ASCIIorDraworSocket() 645 PetscCall(MatSetValues(A, 1, &row, 1, &col, aval, INSERT_VALUES)); in MatView_MPISELL_ASCIIorDraworSocket() 647 aval++; in MatView_MPISELL_ASCIIorDraworSocket()
|
| /petsc/src/mat/impls/baij/seq/ |
| H A D | baijfact.c | 893 MatScalar *rtmp, *ba = b->a, *aa = a->a, dk, uikdi, *aval, *bval; in MatCholeskyFactorNumeric_SeqBAIJ_N_NaturalOrdering() local 915 aval = aa + ai[k]; in MatCholeskyFactorNumeric_SeqBAIJ_N_NaturalOrdering() 920 aval++; in MatCholeskyFactorNumeric_SeqBAIJ_N_NaturalOrdering() 922 rtmp[*acol++] = *aval++; in MatCholeskyFactorNumeric_SeqBAIJ_N_NaturalOrdering()
|
| /petsc/src/mat/impls/sbaij/seq/ |
| H A D | sbaijfact.c | 1505 MatScalar *rtmp, *ba = b->a, *aa = a->a, dk, uikdi, *aval, *bval; in MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace() local 1537 aval = aa + ai[k]; in MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace() 1540 rtmp[*acol++] = *aval++; in MatCholeskyFactorNumeric_SeqSBAIJ_1_NaturalOrdering_inplace()
|
| /petsc/src/mat/impls/aij/seq/ |
| H A D | matmatmult.c | 1304 MatScalar *aa = a->a, *aval, *ba = b->a, *bval, *ca, *cval; in MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ() local 1341 aval = PetscSafePointerPlusOffset(aa, ai[i]); in MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ() 1360 cval[j] += aval[nexta] * bval[nextb]; in MatMatTransposeMultNumeric_SeqAIJ_SeqAIJ()
|
| /petsc/src/binding/petsc4py/src/petsc4py/PETSc/ |
| H A D | Vec.pyx | 2414 cdef PetscScalar aval = asScalar(alpha) 2415 CHKERR(VecISSet(self.vec, idx.iset, aval))
|