Lines Matching refs:nchunks

579   PetscInt  chunksperblock, nchunks, *chunk_slice_map;  in MatMult_SeqSELLCUDA()  local
661 nchunks = cudastruct->totalchunks; in MatMult_SeqSELLCUDA()
663 nblocks = 1 + (nchunks - 1) / chunksperblock; in MatMult_SeqSELLCUDA()
666 …kernel8<2><<<nblocks, dim3(32, 2)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMult_SeqSELLCUDA()
668 …kernel8<4><<<nblocks, dim3(32, 4)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMult_SeqSELLCUDA()
670 …kernel8<8><<<nblocks, dim3(32, 8)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMult_SeqSELLCUDA()
672 …rnel8<16><<<nblocks, dim3(32, 16)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMult_SeqSELLCUDA()
674 …rnel8<32><<<nblocks, dim3(32, 32)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMult_SeqSELLCUDA()
676 …kernel8<2><<<nblocks, dim3(32, 2)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMult_SeqSELLCUDA()
720 PetscInt chunksperblock, nchunks, *chunk_slice_map; in MatMultAdd_SeqSELLCUDA() local
756 nchunks = cudastruct->totalchunks; in MatMultAdd_SeqSELLCUDA()
759 nblocks = 1 + (nchunks - 1) / chunksperblock; in MatMultAdd_SeqSELLCUDA()
762 …kernel8<2><<<nblocks, dim3(32, 2)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMultAdd_SeqSELLCUDA()
764 …kernel8<4><<<nblocks, dim3(32, 4)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMultAdd_SeqSELLCUDA()
766 …kernel8<8><<<nblocks, dim3(32, 8)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMultAdd_SeqSELLCUDA()
768 …rnel8<16><<<nblocks, dim3(32, 16)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMultAdd_SeqSELLCUDA()
770 …rnel8<32><<<nblocks, dim3(32, 32)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMultAdd_SeqSELLCUDA()
772 …kernel8<2><<<nblocks, dim3(32, 2)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMultAdd_SeqSELLCUDA()
821 nchunks = cudastruct->totalchunks; in MatMultAdd_SeqSELLCUDA()
824 nblocks = 1 + (nchunks - 1) / chunksperblock; in MatMultAdd_SeqSELLCUDA()
827 …kernel8<2><<<nblocks, dim3(32, 2)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMultAdd_SeqSELLCUDA()
829 …kernel8<4><<<nblocks, dim3(32, 4)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMultAdd_SeqSELLCUDA()
831 …kernel8<8><<<nblocks, dim3(32, 8)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMultAdd_SeqSELLCUDA()
833 …rnel8<16><<<nblocks, dim3(32, 16)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMultAdd_SeqSELLCUDA()
835 …rnel8<32><<<nblocks, dim3(32, 32)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMultAdd_SeqSELLCUDA()
837 …kernel8<2><<<nblocks, dim3(32, 2)>>>(nrows, sliceheight, chunksperblock, nchunks, chunk_slice_map,… in MatMultAdd_SeqSELLCUDA()