Searched refs:totalchunks (Results 1 – 4 of 4) sorted by relevance
| /petsc/src/mat/impls/sell/seq/seqhip/ |
| H A D | sellhip.hip.cxx | 21 PetscInt totalchunks; member 58 hipstruct->totalchunks = a->totalchunks; in MatSeqSELLHIPCopyToGPU() 67 …PetscCallHIP(hipMalloc((void **)&hipstruct->chunk_slice_map, a->totalchunks * sizeof(*hipstruct->c… in MatSeqSELLHIPCopyToGPU() 68 …PetscCallHIP(hipMemcpy(hipstruct->chunk_slice_map, a->chunk_slice_map, a->totalchunks * sizeof(*a-… in MatSeqSELLHIPCopyToGPU() 69 …s] * (sizeof(MatScalar) + sizeof(PetscInt)) + (a->totalslices + 1 + a->totalchunks) * sizeof(Petsc… in MatSeqSELLHIPCopyToGPU() 189 …etscInt nrows, PetscInt sliceheight, PetscInt chunksperblock, PetscInt totalchunks, const PetscInt… in matmult_seqsell_tiled_kernel8() argument 202 if (cid < totalchunks) { in matmult_seqsell_tiled_kernel8() 244 …etscInt nrows, PetscInt sliceheight, PetscInt chunksperblock, PetscInt totalchunks, const PetscInt… in matmultadd_seqsell_tiled_kernel8() argument 257 if (cid < totalchunks) { in matmultadd_seqsell_tiled_kernel8() 663 nchunks = hipstruct->totalchunks; in MatMult_SeqSELLHIP() [all …]
|
| /petsc/src/mat/impls/sell/seq/seqcuda/ |
| H A D | sellcuda.cu | 18 PetscInt totalchunks; member 55 cudastruct->totalchunks = a->totalchunks; in MatSeqSELLCUDACopyToGPU() 64 …PetscCallCUDA(cudaMalloc((void **)&cudastruct->chunk_slice_map, a->totalchunks * sizeof(*cudastruc… in MatSeqSELLCUDACopyToGPU() 65 …PetscCallCUDA(cudaMemcpy(cudastruct->chunk_slice_map, a->chunk_slice_map, a->totalchunks * sizeof(… in MatSeqSELLCUDACopyToGPU() 66 …s] * (sizeof(MatScalar) + sizeof(PetscInt)) + (a->totalslices + 1 + a->totalchunks) * sizeof(Petsc… in MatSeqSELLCUDACopyToGPU() 185 …etscInt nrows, PetscInt sliceheight, PetscInt chunksperblock, PetscInt totalchunks, const PetscInt… in matmult_seqsell_tiled_kernel8() argument 198 if (cid < totalchunks) { in matmult_seqsell_tiled_kernel8() 240 …etscInt nrows, PetscInt sliceheight, PetscInt chunksperblock, PetscInt totalchunks, const PetscInt… in matmultadd_seqsell_tiled_kernel8() argument 253 if (cid < totalchunks) { in matmultadd_seqsell_tiled_kernel8() 661 nchunks = cudastruct->totalchunks; in MatMult_SeqSELLCUDA() [all …]
|
| /petsc/src/mat/impls/sell/seq/ |
| H A D | sell.c | 1442 PetscInt totalchunks = 0; in MatAssemblyEnd_SeqSELL() local 1493 totalchunks = 1 + (a->sliidx[a->totalslices] - 1) / a->chunksize; in MatAssemblyEnd_SeqSELL() 1495 if (totalchunks != a->totalchunks) { in MatAssemblyEnd_SeqSELL() 1497 PetscCall(PetscMalloc1(totalchunks, &a->chunk_slice_map)); in MatAssemblyEnd_SeqSELL() 1498 a->totalchunks = totalchunks; in MatAssemblyEnd_SeqSELL() 1501 for (i = 0; i < totalchunks; i++) { in MatAssemblyEnd_SeqSELL()
|
| H A D | sell.h | 57 PetscInt totalchunks; /* total number of chunks, CUDA only */ \
|