Home
last modified time | relevance | path

Searched refs:chunksperblock (Results 1 – 2 of 2) sorted by relevance

/petsc/src/mat/impls/sell/seq/seqcuda/
H A D sellcuda.cu 17 PetscInt chunksperblock; member
185 …seqsell_tiled_kernel8(PetscInt nrows, PetscInt sliceheight, PetscInt chunksperblock, PetscInt tota… in matmult_seqsell_tiled_kernel8() argument
196 for (int iter = 0; iter < chunksperblock; iter++) { in matmult_seqsell_tiled_kernel8()
197 cid = blockIdx.x * chunksperblock + iter; /* chunk id */ in matmult_seqsell_tiled_kernel8()
217 …if (iter == chunksperblock - 1 || (cid + 2) * BLOCKY * 32 > sliidx[start_slice + 1]) { /* last ite… in matmult_seqsell_tiled_kernel8()
240 …seqsell_tiled_kernel8(PetscInt nrows, PetscInt sliceheight, PetscInt chunksperblock, PetscInt tota… in matmultadd_seqsell_tiled_kernel8() argument
251 for (int iter = 0; iter < chunksperblock; iter++) { in matmultadd_seqsell_tiled_kernel8()
252 cid = blockIdx.x * chunksperblock + iter; /* chunk id */ in matmultadd_seqsell_tiled_kernel8()
272 …if (iter == chunksperblock - 1 || (cid + 2) * BLOCKY * 32 > sliidx[start_slice + 1]) { /* last ite… in matmultadd_seqsell_tiled_kernel8()
579 PetscInt chunksperblock, nchunks, *chunk_slice_map; in MatMult_SeqSELLCUDA() local
[all …]
/petsc/src/mat/impls/sell/seq/seqhip/
H A D sellhip.hip.cxx 20 PetscInt chunksperblock; member
189 …seqsell_tiled_kernel8(PetscInt nrows, PetscInt sliceheight, PetscInt chunksperblock, PetscInt tota… in matmult_seqsell_tiled_kernel8() argument
200 for (int iter = 0; iter < chunksperblock; iter++) { in matmult_seqsell_tiled_kernel8()
201 cid = blockIdx.x * chunksperblock + iter; /* chunk id */ in matmult_seqsell_tiled_kernel8()
221 …if (iter == chunksperblock - 1 || (cid + 2) * BLOCKY * WARP_SIZE > sliidx[start_slice + 1]) { /* l… in matmult_seqsell_tiled_kernel8()
244 …seqsell_tiled_kernel8(PetscInt nrows, PetscInt sliceheight, PetscInt chunksperblock, PetscInt tota… in matmultadd_seqsell_tiled_kernel8() argument
255 for (int iter = 0; iter < chunksperblock; iter++) { in matmultadd_seqsell_tiled_kernel8()
256 cid = blockIdx.x * chunksperblock + iter; /* chunk id */ in matmultadd_seqsell_tiled_kernel8()
276 …if (iter == chunksperblock - 1 || (cid + 2) * BLOCKY * WARP_SIZE > sliidx[start_slice + 1]) { /* l… in matmultadd_seqsell_tiled_kernel8()
584 PetscInt chunksperblock, nchunks, *chunk_slice_map; in MatMult_SeqSELLHIP() local
[all …]