#pragma once #if defined(__GNUC__) || defined(__clang__) #pragma GCC diagnostic ignored "-Wconversion" #endif /* Author: Henry M. Tufo III e-mail: hmt@cs.brown.edu snail-mail: Division of Applied Mathematics Brown University Providence, RI 02912 Last Modification: 6.21.97 File Description: */ #include #include #define X 0 #define Y 1 #define Z 2 #define XY 3 #define XZ 4 #define YZ 5 #define THRESH 0.2 #define N_HALF 4096 #define PRIV_BUF_SZ 45 /*4096 8192 32768 65536 1048576 */ #define MAX_MSG_BUF 32768 #define FULL 2 #define PARTIAL 1 #define NONE 0 #define BYTE 8 #define BIT_0 0x1 #define BIT_1 0x2 #define BIT_2 0x4 #define BIT_3 0x8 #define BIT_4 0x10 #define BIT_5 0x20 #define BIT_6 0x40 #define BIT_7 0x80 #define TOP_BIT PETSC_INT_MIN #define C 0 #define MAX_VEC 1674 #define FORMAT 30 #define MAX_COL_LEN 100 #define MAX_LINE FORMAT *MAX_COL_LEN #define DELIM " \n \t" #define LINE 12 #define C_LINE 80 #define UT 5 /* dump upper 1/2 */ #define LT 6 /* dump lower 1/2 */ #define SYMM 8 /* we assume symm and dump upper 1/2 */ #define NON_SYMM 9 #define ROW 10 #define COL 11 #define EPS 1.0e-14 #define EPS2 1.0e-07 #define MPI 1 #define NX 2 #define SWAP(a, b) \ do { \ temp = (a); \ (a) = (b); \ (b) = temp; \ } while (0) #define P_SWAP(a, b) \ do { \ ptr = (a); \ (a) = (b); \ (b) = ptr; \ } while (0) #define MAX_FABS(x, y) (PetscAbsScalar(x) > PetscAbsScalar(y)) ? ((PetscScalar)x) : ((PetscScalar)y) #define MIN_FABS(x, y) (PetscAbsScalar(x) < PetscAbsScalar(y)) ? ((PetscScalar)x) : ((PetscScalar)y) /* specer's existence ... can be done w/MAX_ABS */ #define EXISTS(x, y) ((x) == 0.0) ? (y) : (x) #define MULT_NEG_ONE(a) (a) *= -1; #define NEG(a) (a) |= BIT_31; #define POS(a) (a) &= INT_MAX; /* Author: Henry M. Tufo III e-mail: hmt@cs.brown.edu snail-mail: Division of Applied Mathematics Brown University Providence, RI 02912 Last Modification: 6.21.97 */ typedef PetscErrorCode (*vfp)(void *, void *, PetscInt, ...); typedef PetscErrorCode (*rbfp)(PetscScalar *, PetscScalar *, PetscInt); typedef PetscInt (*bfp)(void *, void *, PetscInt *, MPI_Datatype *); /* Author: Henry M. Tufo III e-mail: hmt@cs.brown.edu snail-mail: Division of Applied Mathematics Brown University Providence, RI 02912 Last Modification: 6.21.97 */ PETSC_INTERN PetscMPIInt PCTFS_my_id; PETSC_INTERN PetscMPIInt PCTFS_num_nodes; PETSC_INTERN PetscMPIInt PCTFS_floor_num_nodes; PETSC_INTERN PetscMPIInt PCTFS_i_log2_num_nodes; PETSC_INTERN PetscErrorCode PCTFS_giop(PetscInt *, PetscInt *, PetscInt, PetscInt *); PETSC_INTERN PetscErrorCode PCTFS_grop(PetscScalar *, PetscScalar *, PetscInt, PetscInt *); PETSC_INTERN PetscErrorCode PCTFS_comm_init(void); PETSC_INTERN PetscErrorCode PCTFS_giop_hc(PetscInt *, PetscInt *, PetscInt, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_grop_hc(PetscScalar *, PetscScalar *, PetscInt, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ssgl_radd(PetscScalar *, PetscScalar *, PetscInt, PetscInt *); #define MSGTAG0 101 #define MSGTAG1 1001 #define MSGTAG2 76207 #define MSGTAG3 100001 #define MSGTAG4 163841 #define MSGTAG5 249439 #define MSGTAG6 10000001 #define NON_UNIFORM 0 #define GL_MAX 1 #define GL_MIN 2 #define GL_MULT 3 #define GL_ADD 4 #define GL_B_XOR 5 #define GL_B_OR 6 #define GL_B_AND 7 #define GL_L_XOR 8 #define GL_L_OR 9 #define GL_L_AND 10 #define GL_MAX_ABS 11 #define GL_MIN_ABS 12 #define GL_EXISTS 13 PETSC_INTERN PetscInt *PCTFS_ivec_copy(PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_zero(PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_set(PetscInt *, PetscInt, PetscInt); PETSC_INTERN PetscInt PCTFS_ivec_lb(PetscInt *, PetscInt); PETSC_INTERN PetscInt PCTFS_ivec_ub(PetscInt *, PetscInt); PETSC_INTERN PetscInt PCTFS_ivec_sum(PetscInt *, PetscInt); PETSC_INTERN vfp PCTFS_ivec_fct_addr(PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_non_uniform(PetscInt *, PetscInt *, PetscInt, ...); PETSC_INTERN PetscErrorCode PCTFS_ivec_max(PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_min(PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_mult(PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_add(PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_xor(PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_or(PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_and(PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_lxor(PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_lor(PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_land(PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_and3(PetscInt *, PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_sort_companion(PetscInt *, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_sort(PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_SMI_sort(void *, void *, PetscInt, PetscInt); PETSC_INTERN PetscInt PCTFS_ivec_binary_search(PetscInt, PetscInt *, PetscInt); PETSC_INTERN PetscInt PCTFS_ivec_linear_search(PetscInt, PetscInt *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_ivec_sort_companion_hack(PetscInt *, PetscInt **, PetscInt); #define SORT_INTEGER 1 #define SORT_INT_PTR 2 PETSC_INTERN PetscErrorCode PCTFS_rvec_zero(PetscScalar *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_rvec_one(PetscScalar *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_rvec_set(PetscScalar *, PetscScalar, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_rvec_copy(PetscScalar *, PetscScalar *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_rvec_scale(PetscScalar *, PetscScalar, PetscInt); PETSC_INTERN vfp PCTFS_rvec_fct_addr(PetscInt); PETSC_INTERN PetscErrorCode PCTFS_rvec_add(PetscScalar *, PetscScalar *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_rvec_mult(PetscScalar *, PetscScalar *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_rvec_max(PetscScalar *, PetscScalar *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_rvec_max_abs(PetscScalar *, PetscScalar *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_rvec_min(PetscScalar *, PetscScalar *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_rvec_min_abs(PetscScalar *, PetscScalar *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_vec_exists(PetscScalar *, PetscScalar *, PetscInt); /* Author: Henry M. Tufo III e-mail: hmt@cs.brown.edu snail-mail: Division of Applied Mathematics Brown University Providence, RI 02912 Last Modification: 6.21.97 */ typedef struct gather_scatter_id *PCTFS_gs_ADT; PETSC_INTERN PCTFS_gs_ADT PCTFS_gs_init(PetscInt *, PetscInt, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_gs_gop_vec(PCTFS_gs_ADT, PetscScalar *, const char *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_gs_gop_hc(PCTFS_gs_ADT, PetscScalar *, const char *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_gs_free(PCTFS_gs_ADT); PETSC_INTERN PetscErrorCode PCTFS_gs_init_msg_buf_sz(PetscInt); PETSC_INTERN PetscErrorCode PCTFS_gs_init_vec_sz(PetscInt); /* Module Name: xxt Module Info: need xxt.{c,h} gs.{c,h} comm.{c,h} ivec.{c,h} error.{c,h} author: Henry M. Tufo III e-mail: hmt@asci.uchicago.edu contact: +--------------------------------+--------------------------------+ |MCS Division - Building 221 |Department of Computer Science | |Argonne National Laboratory |Ryerson 152 | |9700 S. Cass Avenue |The University of Chicago | |Argonne, IL 60439 |Chicago, IL 60637 | |(630) 252-5354/5986 ph/fx |(773) 702-6019/8487 ph/fx | +--------------------------------+--------------------------------+ Last Modification: 3.20.01 */ typedef struct xxt_CDT *xxt_ADT; /* Function: XXT_new() Return: ADT ptr or NULL upon failure. Description: This function allocates and returns an xxt handle Usage: xxt_handle = xxt_new(); */ PETSC_INTERN xxt_ADT XXT_new(void); /* Function: XXT_free() Input : pointer to ADT. Description: This function frees the storage associated with an xxt handle Usage: XXT_free(xxt_handle); */ PETSC_INTERN PetscErrorCode XXT_free(xxt_ADT); /* Function: XXT_factor Input : ADT ptr, and pointer to object Return: 0 on failure, 1 on success Description: This function sets the xxt solver xxt assumptions: given n rows of global coarse matrix (E_loc) where o global dofs N = sum_p(n), p=0,P-1 (i.e. row dist. with no dof replication) (5.21.00 will handle dif replication case) o m is the number of columns in E_loc (m>=n) o local2global holds global number of column i (i=0,...,m-1) o local2global holds global number of row i (i=0,...,n-1) o mylocmatvec performs E_loc . x_loc where x_loc is an vector of length m in 1-1 correspondence with local2global (note that gs package takes care of communication). (note do not zero out upper m-n entries!) o mylocmatvec(void *grid_data, double *in, double *out) ML beliefs/usage: move this to ML_XXT_factor routine o my_ml holds address of ML struct associated w/E_loc, grid_data, grid_tag o grid_tag, grid_data, my_ml used in ML_Set_CSolve(my_ml, grid_tag, grid_data, ML_Do_CoarseDirect); o grid_data used in A_matvec(grid_data,v,u); Usage: */ PETSC_INTERN PetscErrorCode XXT_factor(xxt_ADT, /* prev. allocated xxt handle */ PetscInt *, /* global column mapping */ PetscInt, /* local num rows */ PetscInt, /* local num cols */ PetscErrorCode (*)(void *, PetscScalar *, PetscScalar *), /* b_loc=A_local.x_loc */ void *); /* grid data for matvec */ /* Function: XXT_solve Input : ADT ptr, b (rhs) Output: x (soln) Return: Description: This function performs x = E^-1.b Usage: XXT_solve(xxt_handle, double *x, double *b) XXT_solve(xxt_handle, double *x, NULL) assumes x has been initialized to be b */ PETSC_INTERN PetscErrorCode XXT_solve(xxt_ADT, PetscScalar *, PetscScalar *); /* Function: XXT_sp_1() Input : pointer to ADT Output: Return: Description: sets xxt parameter 1 in xxt_handle Usage: implement later void XXT_sp_1(xxt_handle,parameter 1 value) */ /* Module Name: xyt Module Info: need xyt.{c,h} gs.{c,h} comm.{c,h} ivec.{c,h} error.{c,h} author: Henry M. Tufo III e-mail: hmt@asci.uchicago.edu contact: +--------------------------------+--------------------------------+ |MCS Division - Building 221 |Department of Computer Science | |Argonne National Laboratory |Ryerson 152 | |9700 S. Cass Avenue |The University of Chicago | |Argonne, IL 60439 |Chicago, IL 60637 | |(630) 252-5354/5986 ph/fx |(773) 702-6019/8487 ph/fx | +--------------------------------+--------------------------------+ Last Modification: 3.20.01 */ typedef struct xyt_CDT *xyt_ADT; /* Function: XYT_new() Return: ADT ptr or NULL upon failure. Description: This function allocates and returns an xyt handle Usage: xyt_handle = xyt_new(); */ PETSC_INTERN xyt_ADT XYT_new(void); /* Function: XYT_free() Input : pointer to ADT. Description: This function frees the storage associated with an xyt handle Usage: XYT_free(xyt_handle); */ PETSC_INTERN PetscErrorCode XYT_free(xyt_ADT); /* Function: XYT_factor Input : ADT ptr, and pointer to object Output: Return: 0 on failure, 1 on success Description: This function sets the xyt solver xyt assumptions: given n rows of global coarse matrix (E_loc) where o global dofs N = sum_p(n), p=0,P-1 (i.e. row dist. with no dof replication) (5.21.00 will handle dif replication case) o m is the number of columns in E_loc (m>=n) o local2global holds global number of column i (i=0,...,m-1) o local2global holds global number of row i (i=0,...,n-1) o mylocmatvec performs E_loc . x_loc where x_loc is an vector of length m in 1-1 correspondence with local2global (note that gs package takes care of communication). (note do not zero out upper m-n entries!) o mylocmatvec(void *grid_data, double *in, double *out) ML beliefs/usage: move this to ML_XYT_factor routine o my_ml holds address of ML struct associated w/E_loc, grid_data, grid_tag o grid_tag, grid_data, my_ml used in ML_Set_CSolve(my_ml, grid_tag, grid_data, ML_Do_CoarseDirect); o grid_data used in A_matvec(grid_data,v,u); Usage: */ PETSC_INTERN PetscErrorCode XYT_factor(xyt_ADT, /* prev. allocated xyt handle */ PetscInt *, /* global column mapping */ PetscInt, /* local num rows */ PetscInt, /* local num cols */ PetscErrorCode (*)(void *, PetscScalar *, PetscScalar *), /* b_loc=A_local.x_loc */ void *); /* grid data for matvec */ /* Function: XYT_solve Input : ADT ptr, b (rhs) Output: x (soln) Return: Description: This function performs x = E^-1.b Usage: XYT_solve(xyt_handle, double *x, double *b) */ PETSC_INTERN PetscErrorCode XYT_solve(xyt_ADT, PetscScalar *, PetscScalar *); /* Function: XYT_stats Input : handle */ PETSC_INTERN PetscErrorCode XYT_stats(xyt_ADT); /* Author: Henry M. Tufo III e-mail: hmt@cs.brown.edu snail-mail: Division of Applied Mathematics Brown University Providence, RI 02912 Last Modification: 11.21.97 */ PETSC_INTERN PetscInt PCTFS_div_ceil(PetscInt, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_set_bit_mask(PetscInt *, PetscInt, PetscInt); PETSC_INTERN PetscInt PCTFS_len_bit_mask(PetscInt); PETSC_INTERN PetscInt PCTFS_ct_bits(char *, PetscInt); PETSC_INTERN PetscErrorCode PCTFS_bm_to_proc(char *, PetscInt, PetscInt *); PETSC_INTERN PetscInt PCTFS_len_buf(PetscInt, PetscInt);