Searched refs:slice_id (Results 1 – 2 of 2) sorted by relevance
| /petsc/src/mat/impls/sell/seq/seqhip/ |
| H A D | sellhip.hip.cxx | 80 PetscInt i, row, slice_id, row_in_slice; in matmult_seqsell_basic_kernel() local 85 slice_id = row / sliceheight; in matmult_seqsell_basic_kernel() 88 …for (i = sliidx[slice_id] + row_in_slice; i < sliidx[slice_id + 1]; i += sliceheight) sum += aval[… in matmult_seqsell_basic_kernel() 95 PetscInt i, row, slice_id, row_in_slice; in matmultadd_seqsell_basic_kernel() local 100 slice_id = row / sliceheight; in matmultadd_seqsell_basic_kernel() 103 …for (i = sliidx[slice_id] + row_in_slice; i < sliidx[slice_id + 1]; i += sliceheight) sum += aval[… in matmultadd_seqsell_basic_kernel() 115 PetscInt i, row, slice_id = blockIdx.x; in matmult_seqsell_tiled_kernel9() local 122 row = slice_id * sliceheight + threadIdx.x % sliceheight; in matmult_seqsell_tiled_kernel9() 124 …for (i = sliidx[slice_id] + threadIdx.x + WARP_SIZE * threadIdx.y; i < sliidx[slice_id + 1]; i += … in matmult_seqsell_tiled_kernel9() 144 PetscInt i, row, slice_id = blockIdx.x; in matmultadd_seqsell_tiled_kernel9() local [all …]
|
| /petsc/src/mat/impls/sell/seq/seqcuda/ |
| H A D | sellcuda.cu | 77 PetscInt i, row, slice_id, row_in_slice; in matmult_seqsell_basic_kernel() local 82 slice_id = row / sliceheight; in matmult_seqsell_basic_kernel() 85 …for (i = sliidx[slice_id] + row_in_slice; i < sliidx[slice_id + 1]; i += sliceheight) sum += aval[… in matmult_seqsell_basic_kernel() 92 PetscInt i, row, slice_id, row_in_slice; in matmultadd_seqsell_basic_kernel() local 97 slice_id = row / sliceheight; in matmultadd_seqsell_basic_kernel() 100 …for (i = sliidx[slice_id] + row_in_slice; i < sliidx[slice_id + 1]; i += sliceheight) sum += aval[… in matmultadd_seqsell_basic_kernel() 111 PetscInt i, row, slice_id = blockIdx.x; in matmult_seqsell_tiled_kernel9() local 118 row = slice_id * sliceheight + threadIdx.x % sliceheight; in matmult_seqsell_tiled_kernel9() 120 …for (i = sliidx[slice_id] + threadIdx.x + 32 * threadIdx.y; i < sliidx[slice_id + 1]; i += 32 * BL… in matmult_seqsell_tiled_kernel9() 140 PetscInt i, row, slice_id = blockIdx.x; in matmultadd_seqsell_tiled_kernel9() local [all …]
|