Home
last modified time | relevance | path

Searched refs:slice_id (Results 1 – 2 of 2) sorted by relevance

/petsc/src/mat/impls/sell/seq/seqhip/
H A Dsellhip.hip.cxx80 PetscInt i, row, slice_id, row_in_slice; in matmult_seqsell_basic_kernel() local
85 slice_id = row / sliceheight; in matmult_seqsell_basic_kernel()
88 …for (i = sliidx[slice_id] + row_in_slice; i < sliidx[slice_id + 1]; i += sliceheight) sum += aval[… in matmult_seqsell_basic_kernel()
95 PetscInt i, row, slice_id, row_in_slice; in matmultadd_seqsell_basic_kernel() local
100 slice_id = row / sliceheight; in matmultadd_seqsell_basic_kernel()
103 …for (i = sliidx[slice_id] + row_in_slice; i < sliidx[slice_id + 1]; i += sliceheight) sum += aval[… in matmultadd_seqsell_basic_kernel()
115 PetscInt i, row, slice_id = blockIdx.x; in matmult_seqsell_tiled_kernel9() local
122 row = slice_id * sliceheight + threadIdx.x % sliceheight; in matmult_seqsell_tiled_kernel9()
124 …for (i = sliidx[slice_id] + threadIdx.x + WARP_SIZE * threadIdx.y; i < sliidx[slice_id + 1]; i += … in matmult_seqsell_tiled_kernel9()
144 PetscInt i, row, slice_id = blockIdx.x; in matmultadd_seqsell_tiled_kernel9() local
[all …]
/petsc/src/mat/impls/sell/seq/seqcuda/
H A Dsellcuda.cu77 PetscInt i, row, slice_id, row_in_slice; in matmult_seqsell_basic_kernel() local
82 slice_id = row / sliceheight; in matmult_seqsell_basic_kernel()
85 …for (i = sliidx[slice_id] + row_in_slice; i < sliidx[slice_id + 1]; i += sliceheight) sum += aval[… in matmult_seqsell_basic_kernel()
92 PetscInt i, row, slice_id, row_in_slice; in matmultadd_seqsell_basic_kernel() local
97 slice_id = row / sliceheight; in matmultadd_seqsell_basic_kernel()
100 …for (i = sliidx[slice_id] + row_in_slice; i < sliidx[slice_id + 1]; i += sliceheight) sum += aval[… in matmultadd_seqsell_basic_kernel()
111 PetscInt i, row, slice_id = blockIdx.x; in matmult_seqsell_tiled_kernel9() local
118 row = slice_id * sliceheight + threadIdx.x % sliceheight; in matmult_seqsell_tiled_kernel9()
120 …for (i = sliidx[slice_id] + threadIdx.x + 32 * threadIdx.y; i < sliidx[slice_id + 1]; i += 32 * BL… in matmult_seqsell_tiled_kernel9()
140 PetscInt i, row, slice_id = blockIdx.x; in matmultadd_seqsell_tiled_kernel9() local
[all …]