Home
last modified time | relevance | path

Searched refs:totalchunks (Results 1 – 4 of 4) sorted by relevance

/petsc/src/mat/impls/sell/seq/seqhip/
H A D sellhip.hip.cxx 21 PetscInt totalchunks; member
58 hipstruct->totalchunks = a->totalchunks; in MatSeqSELLHIPCopyToGPU()
67 …PetscCallHIP(hipMalloc((void **)&hipstruct->chunk_slice_map, a->totalchunks * sizeof(*hipstruct->c… in MatSeqSELLHIPCopyToGPU()
68 …PetscCallHIP(hipMemcpy(hipstruct->chunk_slice_map, a->chunk_slice_map, a->totalchunks * sizeof(*a-… in MatSeqSELLHIPCopyToGPU()
69 …s] * (sizeof(MatScalar) + sizeof(PetscInt)) + (a->totalslices + 1 + a->totalchunks) * sizeof(Petsc… in MatSeqSELLHIPCopyToGPU()
189 …etscInt nrows, PetscInt sliceheight, PetscInt chunksperblock, PetscInt totalchunks, const PetscInt… in matmult_seqsell_tiled_kernel8() argument
202 if (cid < totalchunks) { in matmult_seqsell_tiled_kernel8()
244 …etscInt nrows, PetscInt sliceheight, PetscInt chunksperblock, PetscInt totalchunks, const PetscInt… in matmultadd_seqsell_tiled_kernel8() argument
257 if (cid < totalchunks) { in matmultadd_seqsell_tiled_kernel8()
663 nchunks = hipstruct->totalchunks; in MatMult_SeqSELLHIP()
[all …]
/petsc/src/mat/impls/sell/seq/seqcuda/
H A D sellcuda.cu 18 PetscInt totalchunks; member
55 cudastruct->totalchunks = a->totalchunks; in MatSeqSELLCUDACopyToGPU()
64 …PetscCallCUDA(cudaMalloc((void **)&cudastruct->chunk_slice_map, a->totalchunks * sizeof(*cudastruc… in MatSeqSELLCUDACopyToGPU()
65 …PetscCallCUDA(cudaMemcpy(cudastruct->chunk_slice_map, a->chunk_slice_map, a->totalchunks * sizeof(… in MatSeqSELLCUDACopyToGPU()
66 …s] * (sizeof(MatScalar) + sizeof(PetscInt)) + (a->totalslices + 1 + a->totalchunks) * sizeof(Petsc… in MatSeqSELLCUDACopyToGPU()
185 …etscInt nrows, PetscInt sliceheight, PetscInt chunksperblock, PetscInt totalchunks, const PetscInt… in matmult_seqsell_tiled_kernel8() argument
198 if (cid < totalchunks) { in matmult_seqsell_tiled_kernel8()
240 …etscInt nrows, PetscInt sliceheight, PetscInt chunksperblock, PetscInt totalchunks, const PetscInt… in matmultadd_seqsell_tiled_kernel8() argument
253 if (cid < totalchunks) { in matmultadd_seqsell_tiled_kernel8()
661 nchunks = cudastruct->totalchunks; in MatMult_SeqSELLCUDA()
[all …]
/petsc/src/mat/impls/sell/seq/
H A D sell.c 1442 PetscInt totalchunks = 0; in MatAssemblyEnd_SeqSELL() local
1493 totalchunks = 1 + (a->sliidx[a->totalslices] - 1) / a->chunksize; in MatAssemblyEnd_SeqSELL()
1495 if (totalchunks != a->totalchunks) { in MatAssemblyEnd_SeqSELL()
1497 PetscCall(PetscMalloc1(totalchunks, &a->chunk_slice_map)); in MatAssemblyEnd_SeqSELL()
1498 a->totalchunks = totalchunks; in MatAssemblyEnd_SeqSELL()
1501 for (i = 0; i < totalchunks; i++) { in MatAssemblyEnd_SeqSELL()
H A D sell.h 57 PetscInt totalchunks; /* total number of chunks, CUDA only */ \