| /libCEED/include/ceed/jit-source/cuda/ |
| H A D | cuda-atomic-add-fallback.h | 15 __device__ CeedScalar atomicAdd(CeedScalar *address, CeedScalar val) { in atomicAdd() function
|
| H A D | cuda-ref-restriction-at-points.h | 25 …atomicAdd(&v[ind + comp * RSTR_COMP_STRIDE], u[loc_node + comp * RSTR_ELEM_SIZE * RSTR_NUM_ELEM + … in AtPointsTranspose()
|
| H A D | cuda-gen-templates.h | 107 …for (CeedInt comp = 0; comp < NUM_COMP; comp++) atomicAdd(&d_v[ind + COMP_STRIDE * comp], r_v[comp… in WriteLVecStandard1d() 121 atomicAdd(&d_v[ind + COMP_STRIDE * target_comp], r_v[target_comp]); in WriteLVecStandard1d_Single() 229 …for (CeedInt comp = 0; comp < NUM_COMP; comp++) atomicAdd(&d_v[ind + COMP_STRIDE * comp], r_v[comp… in WriteLVecStandard2d() 245 atomicAdd(&d_v[ind + COMP_STRIDE * target_comp], r_v[target_comp]); in WriteLVecStandard2d_Single() 393 …for (CeedInt comp = 0; comp < NUM_COMP; comp++) atomicAdd(&d_v[ind + COMP_STRIDE * comp], r_v[z + … in WriteLVecStandard3d() 411 atomicAdd(&d_v[ind + COMP_STRIDE * target_comp], r_v[target_node_z + target_comp * P_1D]); in WriteLVecStandard3d_Single()
|
| H A D | cuda-ref-restriction-offset.h | 38 …atomicAdd(&v[ind + comp * RSTR_COMP_STRIDE], u[loc_node + comp * RSTR_ELEM_SIZE * RSTR_NUM_ELEM + … in OffsetTranspose()
|
| H A D | cuda-ref-restriction-oriented.h | 42 atomicAdd(&v[ind + comp * RSTR_COMP_STRIDE], in OrientedTranspose()
|
| H A D | cuda-ref-restriction-curl-oriented.h | 82 atomicAdd(&v[ind + comp * RSTR_COMP_STRIDE], value); in CurlOrientedTranspose() 140 atomicAdd(&v[ind + comp * RSTR_COMP_STRIDE], value); in CurlOrientedUnsignedTranspose()
|
| H A D | cuda-ref-basis-tensor-at-points.h | 181 …for (CeedInt j = 0; j < Q; j++) atomicAdd(&out[(a * Q + (j + p) % Q) * post + c], chebyshev_x[(j +… in InterpTransposeAtPoints() 371 …for (CeedInt j = 0; j < Q; j++) atomicAdd(&out[(a * Q + (j + p) % Q) * post + c], chebyshev_x[(j +… in GradTransposeAtPoints()
|
| /libCEED/include/ceed/jit-source/hip/ |
| H A D | hip-shared-basis-tensor-at-points-templates.h | 78 …atomicAdd(&data.slice[comp * Q_1D + (i + data.t_id_x) % Q_1D], chebyshev_x[(i + data.t_id_x) % Q_1… in InterpTransposeAtPoints1d() 125 …atomicAdd(&data.slice[comp * Q_1D + (i + data.t_id_x) % Q_1D], chebyshev_x[(i + data.t_id_x) % Q_1… in GradTransposeAtPoints1d() 198 …if (data.t_id_x < Q_1D && data.t_id_y < Q_1D) atomicAdd(&data.slice[jj + ii * Q_1D], chebyshev_x[j… in InterpTransposeAtPoints2d() 274 …if (data.t_id_x < Q_1D && data.t_id_y < Q_1D) atomicAdd(&data.slice[jj + ii * Q_1D], chebyshev_x[j… in GradTransposeAtPoints2d() 359 …if (data.t_id_x < Q_1D && data.t_id_y < Q_1D) atomicAdd(&data.slice[jj + ii * Q_1D], chebyshev_x[j… in InterpTransposeAtPoints3d() 458 …if (data.t_id_x < Q_1D && data.t_id_y < Q_1D) atomicAdd(&data.slice[jj + ii * Q_1D], chebyshev_x[j… in GradTransposeAtPoints3d()
|
| H A D | hip-ref-restriction-at-points.h | 25 …atomicAdd(&v[ind + comp * RSTR_COMP_STRIDE], u[loc_node + comp * RSTR_ELEM_SIZE * RSTR_NUM_ELEM + … in AtPointsTranspose()
|
| H A D | hip-gen-templates.h | 106 …for (CeedInt comp = 0; comp < NUM_COMP; comp++) atomicAdd(&d_v[ind + COMP_STRIDE * comp], r_v[comp… in WriteLVecStandard1d() 120 atomicAdd(&d_v[ind + COMP_STRIDE * target_comp], r_v[target_comp]); in WriteLVecStandard1d_Single() 227 …for (CeedInt comp = 0; comp < NUM_COMP; comp++) atomicAdd(&d_v[ind + COMP_STRIDE * comp], r_v[comp… in WriteLVecStandard2d() 243 atomicAdd(&d_v[ind + COMP_STRIDE * target_comp], r_v[target_comp]); in WriteLVecStandard2d_Single() 390 …for (CeedInt comp = 0; comp < NUM_COMP; comp++) atomicAdd(&d_v[ind + COMP_STRIDE * comp], r_v[z + … in WriteLVecStandard3d() 408 atomicAdd(&d_v[ind + COMP_STRIDE * target_comp], r_v[target_node_z + target_comp * P_1D]); in WriteLVecStandard3d_Single()
|
| H A D | hip-ref-restriction-offset.h | 38 …atomicAdd(&v[ind + comp * RSTR_COMP_STRIDE], u[loc_node + comp * RSTR_ELEM_SIZE * RSTR_NUM_ELEM + … in OffsetTranspose()
|
| H A D | hip-ref-restriction-oriented.h | 42 atomicAdd(&v[ind + comp * RSTR_COMP_STRIDE], in OrientedTranspose()
|
| H A D | hip-ref-restriction-curl-oriented.h | 82 atomicAdd(&v[ind + comp * RSTR_COMP_STRIDE], value); in CurlOrientedTranspose() 140 atomicAdd(&v[ind + comp * RSTR_COMP_STRIDE], value); in CurlOrientedUnsignedTranspose()
|
| H A D | hip-ref-basis-tensor-at-points.h | 181 …for (CeedInt j = 0; j < Q; j++) atomicAdd(&out[(a * Q + (j + p) % Q) * post + c], chebyshev_x[(j +… in InterpTransposeAtPoints() 371 …for (CeedInt j = 0; j < Q; j++) atomicAdd(&out[(a * Q + (j + p) % Q) * post + c], chebyshev_x[(j +… in GradTransposeAtPoints()
|
| /libCEED/ |
| H A D | README.md | 227 However, some libCEED backends use non-deterministic operations, such as `atomicAdd` for increased …
|