Lines Matching refs:MatScalar
14 MatScalar *val; /* value array, device pointer */
48 …PetscCallHIP(hipMemcpy(hipstruct->val, a->val, a->sliidx[a->totalslices] * sizeof(MatScalar), hipM… in MatSeqSELLHIPCopyToGPU()
49 PetscCall(PetscLogCpuToGpu(a->sliidx[a->totalslices] * (sizeof(MatScalar)))); in MatSeqSELLHIPCopyToGPU()
69 …PetscCall(PetscLogCpuToGpu(a->sliidx[a->totalslices] * (sizeof(MatScalar) + sizeof(PetscInt)) + (a… in MatSeqSELLHIPCopyToGPU()
78 …el(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmult_seqsell_basic_kernel()
81 MatScalar sum; in matmult_seqsell_basic_kernel()
93 …el(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmultadd_seqsell_basic_kernel()
96 MatScalar sum; in matmultadd_seqsell_basic_kernel()
112 …l9(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmult_seqsell_tiled_kernel9()
114 __shared__ MatScalar shared[WARP_SIZE][BLOCKY]; in matmult_seqsell_tiled_kernel9()
141 …l9(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmultadd_seqsell_tiled_kernel9()
143 __shared__ MatScalar shared[WARP_SIZE][BLOCKY]; in matmultadd_seqsell_tiled_kernel9()
169 __device__ __forceinline__ static bool segment_scan(PetscInt flag[], MatScalar shared[], PetscScala… in segment_scan()
189 …chunks, const PetscInt *chunk_slice_map, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmult_seqsell_tiled_kernel8()
191 __shared__ MatScalar shared[BLOCKY * WARP_SIZE]; in matmult_seqsell_tiled_kernel8()
194 AtomicAdd<MatScalar> atomAdd; in matmult_seqsell_tiled_kernel8()
244 …chunks, const PetscInt *chunk_slice_map, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmultadd_seqsell_tiled_kernel8()
246 __shared__ MatScalar shared[BLOCKY * WARP_SIZE]; in matmultadd_seqsell_tiled_kernel8()
249 AtomicAdd<MatScalar> atomAdd; in matmultadd_seqsell_tiled_kernel8()
298 …l7(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmult_seqsell_tiled_kernel7()
313 …l7(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmultadd_seqsell_tiled_kernel7()
331 …l6(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in PETSC_PRAGMA_DIAGNOSTIC_IGNORED_END()
333 __shared__ MatScalar shared[32 * 16]; in PETSC_PRAGMA_DIAGNOSTIC_IGNORED_END()
359 …l5(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmult_seqsell_tiled_kernel5()
361 __shared__ MatScalar shared[32 * 16]; in matmult_seqsell_tiled_kernel5()
385 …l4(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmult_seqsell_tiled_kernel4()
387 __shared__ MatScalar shared[32 * 16]; in matmult_seqsell_tiled_kernel4()
409 …l3(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmult_seqsell_tiled_kernel3()
411 __shared__ MatScalar shared[32 * 16]; in matmult_seqsell_tiled_kernel3()
431 …l2(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmult_seqsell_tiled_kernel2()
433 __shared__ MatScalar shared[32 * 16]; in matmult_seqsell_tiled_kernel2()
451 …l6(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmultadd_seqsell_tiled_kernel6()
453 __shared__ MatScalar shared[32 * 16]; in matmultadd_seqsell_tiled_kernel6()
479 …l5(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmultadd_seqsell_tiled_kernel5()
481 __shared__ MatScalar shared[32 * 16]; in matmultadd_seqsell_tiled_kernel5()
505 …l4(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmultadd_seqsell_tiled_kernel4()
507 __shared__ MatScalar shared[32 * 16]; in matmultadd_seqsell_tiled_kernel4()
529 …l3(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmultadd_seqsell_tiled_kernel3()
531 __shared__ MatScalar shared[32 * 16]; in matmultadd_seqsell_tiled_kernel3()
551 …l2(PetscInt nrows, PetscInt sliceheight, const PetscInt *acolidx, const MatScalar *aval, const Pet… in matmultadd_seqsell_tiled_kernel2()
553 __shared__ MatScalar shared[32 * 16]; in matmultadd_seqsell_tiled_kernel2()
578 MatScalar *aval; in MatMult_SeqSELLHIP()
715 MatScalar *aval = hipstruct->val; in MatMultAdd_SeqSELLHIP()