1 #include <../src/ksp/pc/impls/bddc/bddc.h> 2 #include <../src/ksp/pc/impls/bddc/bddcprivate.h> 3 4 /* prototypes for deluxe functions */ 5 static PetscErrorCode PCBDDCScalingCreate_Deluxe(PC); 6 static PetscErrorCode PCBDDCScalingDestroy_Deluxe(PC); 7 static PetscErrorCode PCBDDCScalingSetUp_Deluxe(PC); 8 static PetscErrorCode PCBDDCScalingSetUp_Deluxe_Par(PC,PetscInt,PetscInt,PetscInt[],PetscInt[]); 9 static PetscErrorCode PCBDDCScalingSetUp_Deluxe_Seq(PC,PetscInt,PetscInt,PetscInt[],PetscInt[]); 10 static PetscErrorCode PCBDDCScalingReset_Deluxe_Solvers(PCBDDCDeluxeScaling); 11 12 #undef __FUNCT__ 13 #define __FUNCT__ "PCBDDCScalingExtension_Basic" 14 static PetscErrorCode PCBDDCScalingExtension_Basic(PC pc, Vec local_interface_vector, Vec global_vector) 15 { 16 PC_IS* pcis = (PC_IS*)pc->data; 17 PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 18 PetscErrorCode ierr; 19 20 PetscFunctionBegin; 21 /* Apply partition of unity */ 22 ierr = VecPointwiseMult(pcbddc->work_scaling,pcis->D,local_interface_vector);CHKERRQ(ierr); 23 ierr = VecSet(global_vector,0.0);CHKERRQ(ierr); 24 ierr = VecScatterBegin(pcis->global_to_B,pcbddc->work_scaling,global_vector,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 25 ierr = VecScatterEnd(pcis->global_to_B,pcbddc->work_scaling,global_vector,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 26 PetscFunctionReturn(0); 27 } 28 29 #undef __FUNCT__ 30 #define __FUNCT__ "PCBDDCScalingExtension_Deluxe" 31 static PetscErrorCode PCBDDCScalingExtension_Deluxe(PC pc, Vec x, Vec y) 32 { 33 PC_IS* pcis=(PC_IS*)pc->data; 34 PC_BDDC* pcbddc=(PC_BDDC*)pc->data; 35 PCBDDCDeluxeScaling deluxe_ctx = pcbddc->deluxe_ctx; 36 PCBDDCSubSchurs sub_schurs = deluxe_ctx->sub_schurs; 37 PetscInt i; 38 PetscErrorCode ierr; 39 40 /* TODO CHECK STUFF RELATED WITH FAKE WORK */ 41 PetscFunctionBegin; 42 ierr = VecSet(pcbddc->work_scaling,0.0);CHKERRQ(ierr); /* needed by the fake work below */ 43 if (deluxe_ctx->n_simple) { 44 /* scale deluxe vertices using diagonal scaling */ 45 PetscScalar *array_x,*array_D,*array; 46 ierr = VecGetArray(x,&array_x);CHKERRQ(ierr); 47 ierr = VecGetArray(pcis->D,&array_D);CHKERRQ(ierr); 48 ierr = VecGetArray(pcbddc->work_scaling,&array);CHKERRQ(ierr); 49 for (i=0;i<deluxe_ctx->n_simple;i++) { 50 array[deluxe_ctx->idx_simple_B[i]] = array_x[deluxe_ctx->idx_simple_B[i]]*array_D[deluxe_ctx->idx_simple_B[i]]; 51 } 52 ierr = VecRestoreArray(pcbddc->work_scaling,&array);CHKERRQ(ierr); 53 ierr = VecRestoreArray(pcis->D,&array_D);CHKERRQ(ierr); 54 ierr = VecRestoreArray(x,&array_x);CHKERRQ(ierr); 55 } 56 /* sequential part : all problems and Schur applications collapsed into a single matrix vector multiplication and ksp solution */ 57 if (deluxe_ctx->seq_mat) { 58 ierr = VecScatterBegin(deluxe_ctx->seq_scctx,x,deluxe_ctx->seq_work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 59 ierr = VecScatterEnd(deluxe_ctx->seq_scctx,x,deluxe_ctx->seq_work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 60 ierr = MatMult(deluxe_ctx->seq_mat,deluxe_ctx->seq_work1,deluxe_ctx->seq_work2);CHKERRQ(ierr); 61 ierr = KSPSolve(deluxe_ctx->seq_ksp,deluxe_ctx->seq_work2,deluxe_ctx->seq_work1);CHKERRQ(ierr); 62 /* fake work due to final ADD VALUES and vertices scaling needed? TODO: check it */ 63 ierr = VecScatterBegin(deluxe_ctx->seq_scctx,deluxe_ctx->seq_work1,pcbddc->work_scaling,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 64 ierr = VecScatterEnd(deluxe_ctx->seq_scctx,deluxe_ctx->seq_work1,pcbddc->work_scaling,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 65 } 66 /* parallel part */ 67 for (i=0;i<deluxe_ctx->par_colors;i++) { 68 if (deluxe_ctx->par_ksp[i]) { 69 PetscMPIInt color_rank; 70 PetscInt subidx = deluxe_ctx->par_col2sub[i]; 71 /* restrict on subset */ 72 ierr = VecScatterBegin(deluxe_ctx->par_scctx_s[i],x,sub_schurs->work1[subidx],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 73 ierr = VecScatterEnd(deluxe_ctx->par_scctx_s[i],x,sub_schurs->work1[subidx],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 74 /* S_Ej */ 75 ierr = MatMult(sub_schurs->S_Ej[subidx],sub_schurs->work1[subidx],sub_schurs->work2[subidx]);CHKERRQ(ierr); 76 /* (\sum_j S_Ej)^-1 */ 77 ierr = VecSet(deluxe_ctx->par_vec[i],0.0);CHKERRQ(ierr); 78 ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],sub_schurs->work2[subidx],deluxe_ctx->par_vec[i],ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 79 ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],sub_schurs->work2[subidx],deluxe_ctx->par_vec[i],ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 80 ierr = KSPSolve(deluxe_ctx->par_ksp[i],deluxe_ctx->par_vec[i],deluxe_ctx->par_vec[i]);CHKERRQ(ierr); 81 ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)deluxe_ctx->par_ksp[i]),&color_rank);CHKERRQ(ierr); 82 /* get back solution on subset */ 83 ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_vec[i],sub_schurs->work1[subidx],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 84 ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_vec[i],sub_schurs->work1[subidx],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 85 if (!color_rank) { /* only the master process in coloured comm copies the computed values */ 86 ierr = VecScatterBegin(deluxe_ctx->par_scctx_s[i],sub_schurs->work1[subidx],pcbddc->work_scaling,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 87 ierr = VecScatterEnd(deluxe_ctx->par_scctx_s[i],sub_schurs->work1[subidx],pcbddc->work_scaling,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 88 } 89 } 90 } 91 /* put local boundary part in global vector */ 92 ierr = VecSet(y,0.0);CHKERRQ(ierr); 93 ierr = VecScatterBegin(pcis->global_to_B,pcbddc->work_scaling,y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 94 ierr = VecScatterEnd(pcis->global_to_B,pcbddc->work_scaling,y,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 95 PetscFunctionReturn(0); 96 } 97 98 #undef __FUNCT__ 99 #define __FUNCT__ "PCBDDCScalingExtension" 100 PetscErrorCode PCBDDCScalingExtension(PC pc, Vec local_interface_vector, Vec global_vector) 101 { 102 PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 103 PetscErrorCode ierr; 104 105 PetscFunctionBegin; 106 PetscValidHeaderSpecific(pc,PC_CLASSID,1); 107 PetscValidHeaderSpecific(local_interface_vector,VEC_CLASSID,2); 108 PetscValidHeaderSpecific(global_vector,VEC_CLASSID,3); 109 if (local_interface_vector == pcbddc->work_scaling) { 110 SETERRQ(PETSC_COMM_WORLD,PETSC_ERR_SUP,"Local vector cannot be pcbddc->work_scaling!\n"); 111 } 112 ierr = PetscTryMethod(pc,"PCBDDCScalingExtension_C",(PC,Vec,Vec),(pc,local_interface_vector,global_vector));CHKERRQ(ierr); 113 PetscFunctionReturn(0); 114 } 115 116 #undef __FUNCT__ 117 #define __FUNCT__ "PCBDDCScalingRestriction_Basic" 118 static PetscErrorCode PCBDDCScalingRestriction_Basic(PC pc, Vec global_vector, Vec local_interface_vector) 119 { 120 PetscErrorCode ierr; 121 PC_IS* pcis = (PC_IS*)pc->data; 122 123 PetscFunctionBegin; 124 ierr = VecScatterBegin(pcis->global_to_B,global_vector,local_interface_vector,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 125 ierr = VecScatterEnd(pcis->global_to_B,global_vector,local_interface_vector,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 126 /* Apply partition of unity */ 127 ierr = VecPointwiseMult(local_interface_vector,pcis->D,local_interface_vector);CHKERRQ(ierr); 128 PetscFunctionReturn(0); 129 } 130 131 #undef __FUNCT__ 132 #define __FUNCT__ "PCBDDCScalingRestriction_Deluxe" 133 static PetscErrorCode PCBDDCScalingRestriction_Deluxe(PC pc, Vec x, Vec y) 134 { 135 PC_IS* pcis=(PC_IS*)pc->data; 136 PC_BDDC* pcbddc=(PC_BDDC*)pc->data; 137 PCBDDCDeluxeScaling deluxe_ctx = pcbddc->deluxe_ctx; 138 PCBDDCSubSchurs sub_schurs = deluxe_ctx->sub_schurs; 139 PetscInt i; 140 PetscErrorCode ierr; 141 142 PetscFunctionBegin; 143 /* get local boundary part of global vector */ 144 ierr = VecScatterBegin(pcis->global_to_B,x,y,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 145 ierr = VecScatterEnd(pcis->global_to_B,x,y,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 146 if (deluxe_ctx->n_simple) { 147 /* scale deluxe vertices using diagonal scaling */ 148 PetscScalar *array_y,*array_D; 149 ierr = VecGetArray(y,&array_y);CHKERRQ(ierr); 150 ierr = VecGetArray(pcis->D,&array_D);CHKERRQ(ierr); 151 for (i=0;i<deluxe_ctx->n_simple;i++) { 152 array_y[deluxe_ctx->idx_simple_B[i]] *= array_D[deluxe_ctx->idx_simple_B[i]]; 153 } 154 ierr = VecRestoreArray(pcis->D,&array_D);CHKERRQ(ierr); 155 ierr = VecRestoreArray(y,&array_y);CHKERRQ(ierr); 156 } 157 /* sequential part : all problems and Schur applications collapsed into a single matrix vector multiplication and ksp solution */ 158 if (deluxe_ctx->seq_mat) { 159 ierr = VecScatterBegin(deluxe_ctx->seq_scctx,y,deluxe_ctx->seq_work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 160 ierr = VecScatterEnd(deluxe_ctx->seq_scctx,y,deluxe_ctx->seq_work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 161 ierr = KSPSolveTranspose(deluxe_ctx->seq_ksp,deluxe_ctx->seq_work1,deluxe_ctx->seq_work2);CHKERRQ(ierr); 162 ierr = MatMultTranspose(deluxe_ctx->seq_mat,deluxe_ctx->seq_work2,deluxe_ctx->seq_work1);CHKERRQ(ierr); 163 ierr = VecScatterBegin(deluxe_ctx->seq_scctx,deluxe_ctx->seq_work1,y,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 164 ierr = VecScatterEnd(deluxe_ctx->seq_scctx,deluxe_ctx->seq_work1,y,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 165 } 166 /* parallel part */ 167 for (i=0;i<deluxe_ctx->par_colors;i++) { 168 if (deluxe_ctx->par_ksp[i]) { 169 PetscInt subidx = deluxe_ctx->par_col2sub[i]; 170 /* restrict on subset */ 171 ierr = VecScatterBegin(deluxe_ctx->par_scctx_s[i],y,sub_schurs->work1[subidx],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 172 ierr = VecScatterEnd(deluxe_ctx->par_scctx_s[i],y,sub_schurs->work1[subidx],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 173 /* (\sum_j S_Ej)^-T */ 174 ierr = VecSet(deluxe_ctx->par_vec[i],0.0);CHKERRQ(ierr); 175 ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],sub_schurs->work1[subidx],deluxe_ctx->par_vec[i],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 176 ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],sub_schurs->work1[subidx],deluxe_ctx->par_vec[i],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 177 ierr = KSPSolveTranspose(deluxe_ctx->par_ksp[i],deluxe_ctx->par_vec[i],deluxe_ctx->par_vec[i]);CHKERRQ(ierr); 178 ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_vec[i],sub_schurs->work1[subidx],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 179 ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_vec[i],sub_schurs->work1[subidx],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 180 /* S_Ej^T */ 181 ierr = MatMultTranspose(sub_schurs->S_Ej[subidx],sub_schurs->work1[subidx],sub_schurs->work2[subidx]);CHKERRQ(ierr); 182 /* extend to boundary */ 183 ierr = VecScatterBegin(deluxe_ctx->par_scctx_s[i],sub_schurs->work2[subidx],y,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 184 ierr = VecScatterEnd(deluxe_ctx->par_scctx_s[i],sub_schurs->work2[subidx],y,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 185 } 186 } 187 PetscFunctionReturn(0); 188 } 189 190 #undef __FUNCT__ 191 #define __FUNCT__ "PCBDDCScalingRestriction" 192 PetscErrorCode PCBDDCScalingRestriction(PC pc, Vec global_vector, Vec local_interface_vector) 193 { 194 PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 195 PetscErrorCode ierr; 196 197 PetscFunctionBegin; 198 PetscValidHeaderSpecific(pc,PC_CLASSID,1); 199 PetscValidHeaderSpecific(global_vector,VEC_CLASSID,2); 200 PetscValidHeaderSpecific(local_interface_vector,VEC_CLASSID,3); 201 if (local_interface_vector == pcbddc->work_scaling) { 202 SETERRQ(PETSC_COMM_WORLD,PETSC_ERR_SUP,"Local vector should cannot be pcbddc->work_scaling!\n"); 203 } 204 ierr = PetscTryMethod(pc,"PCBDDCScalingRestriction_C",(PC,Vec,Vec),(pc,global_vector,local_interface_vector));CHKERRQ(ierr); 205 PetscFunctionReturn(0); 206 } 207 208 #undef __FUNCT__ 209 #define __FUNCT__ "PCBDDCScalingSetUp" 210 PetscErrorCode PCBDDCScalingSetUp(PC pc) 211 { 212 PC_IS* pcis=(PC_IS*)pc->data; 213 PC_BDDC* pcbddc=(PC_BDDC*)pc->data; 214 PetscErrorCode ierr; 215 216 PetscFunctionBegin; 217 PetscValidHeaderSpecific(pc,PC_CLASSID,1); 218 /* create work vector for the operator */ 219 ierr = VecDestroy(&pcbddc->work_scaling);CHKERRQ(ierr); 220 ierr = VecDuplicate(pcis->vec1_B,&pcbddc->work_scaling);CHKERRQ(ierr); 221 /* always rebuild pcis->D */ 222 if (pcis->use_stiffness_scaling) { 223 ierr = MatGetDiagonal(pcbddc->local_mat,pcis->vec1_N);CHKERRQ(ierr); 224 ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 225 ierr = VecScatterEnd(pcis->N_to_B,pcis->vec1_N,pcis->D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 226 } 227 ierr = VecCopy(pcis->D,pcis->vec1_B);CHKERRQ(ierr); 228 ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 229 ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 230 ierr = VecScatterEnd(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 231 ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_global,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 232 ierr = VecScatterEnd(pcis->global_to_B,pcis->vec1_global,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 233 ierr = VecPointwiseDivide(pcis->D,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 234 /* now setup */ 235 if (pcbddc->use_deluxe_scaling) { 236 if (!pcbddc->deluxe_ctx) { 237 ierr = PCBDDCScalingCreate_Deluxe(pc);CHKERRQ(ierr); 238 } 239 ierr = PCBDDCScalingSetUp_Deluxe(pc);CHKERRQ(ierr); 240 ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCScalingRestriction_C",PCBDDCScalingRestriction_Deluxe);CHKERRQ(ierr); 241 ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCScalingExtension_C",PCBDDCScalingExtension_Deluxe);CHKERRQ(ierr); 242 } else { 243 ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCScalingRestriction_C",PCBDDCScalingRestriction_Basic);CHKERRQ(ierr); 244 ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCScalingExtension_C",PCBDDCScalingExtension_Basic);CHKERRQ(ierr); 245 } 246 247 /* test */ 248 if (pcbddc->dbg_flag) { 249 Vec vec2_global; 250 PetscViewer viewer=pcbddc->dbg_viewer; 251 PetscReal error; 252 253 /* extension -> from local to parallel */ 254 ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 255 ierr = VecSetRandom(pcis->vec1_B,NULL);CHKERRQ(ierr); 256 ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 257 ierr = VecScatterEnd(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 258 ierr = VecDuplicate(pcis->vec1_global,&vec2_global);CHKERRQ(ierr); 259 ierr = VecCopy(pcis->vec1_global,vec2_global);CHKERRQ(ierr); 260 261 ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_global,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 262 ierr = VecScatterEnd(pcis->global_to_B,pcis->vec1_global,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 263 ierr = PCBDDCScalingExtension(pc,pcis->vec1_B,pcis->vec1_global);CHKERRQ(ierr); 264 ierr = VecAXPY(pcis->vec1_global,-1.0,vec2_global);CHKERRQ(ierr); 265 ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&error);CHKERRQ(ierr); 266 ierr = PetscViewerASCIIPrintf(viewer,"Error scaling extension %1.14e\n",error);CHKERRQ(ierr); 267 if (error>1.e-8 && pcbddc->dbg_flag>1) { 268 ierr = VecView(pcis->vec1_global,viewer);CHKERRQ(ierr); 269 } 270 ierr = VecDestroy(&vec2_global);CHKERRQ(ierr); 271 272 /* restriction -> from parallel to local */ 273 ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 274 ierr = VecSetRandom(pcis->vec1_B,NULL);CHKERRQ(ierr); 275 ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 276 ierr = VecScatterEnd(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 277 278 ierr = PCBDDCScalingRestriction(pc,pcis->vec1_global,pcis->vec1_B);CHKERRQ(ierr); 279 ierr = VecScale(pcis->vec1_B,-1.0);CHKERRQ(ierr); 280 ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 281 ierr = VecScatterEnd(pcis->global_to_B,pcis->vec1_B,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 282 ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&error);CHKERRQ(ierr); 283 ierr = PetscViewerASCIIPrintf(viewer,"Error scaling restriction %1.14e\n",error);CHKERRQ(ierr); 284 if (error>1.e-8 && pcbddc->dbg_flag>1) { 285 ierr = VecView(pcis->vec1_global,viewer);CHKERRQ(ierr); 286 } 287 } 288 PetscFunctionReturn(0); 289 } 290 291 #undef __FUNCT__ 292 #define __FUNCT__ "PCBDDCScalingDestroy" 293 PetscErrorCode PCBDDCScalingDestroy(PC pc) 294 { 295 PC_BDDC* pcbddc=(PC_BDDC*)pc->data; 296 PetscErrorCode ierr; 297 298 PetscFunctionBegin; 299 if (pcbddc->deluxe_ctx) { 300 ierr = PCBDDCScalingDestroy_Deluxe(pc);CHKERRQ(ierr); 301 } 302 ierr = VecDestroy(&pcbddc->work_scaling);CHKERRQ(ierr); 303 /* remove functions */ 304 ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCScalingRestriction_C",NULL);CHKERRQ(ierr); 305 ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCScalingExtension_C",NULL);CHKERRQ(ierr); 306 PetscFunctionReturn(0); 307 } 308 309 #undef __FUNCT__ 310 #define __FUNCT__ "PCBDDCScalingCreate_Deluxe" 311 static PetscErrorCode PCBDDCScalingCreate_Deluxe(PC pc) 312 { 313 PC_BDDC* pcbddc=(PC_BDDC*)pc->data; 314 PCBDDCDeluxeScaling deluxe_ctx; 315 PetscErrorCode ierr; 316 317 PetscFunctionBegin; 318 ierr = PetscNew(&deluxe_ctx);CHKERRQ(ierr); 319 ierr = PCBDDCSubSchursCreate(&deluxe_ctx->sub_schurs);CHKERRQ(ierr); 320 pcbddc->deluxe_ctx = deluxe_ctx; 321 PetscFunctionReturn(0); 322 } 323 324 #undef __FUNCT__ 325 #define __FUNCT__ "PCBDDCScalingDestroy_Deluxe" 326 static PetscErrorCode PCBDDCScalingDestroy_Deluxe(PC pc) 327 { 328 PC_BDDC* pcbddc=(PC_BDDC*)pc->data; 329 PetscErrorCode ierr; 330 331 PetscFunctionBegin; 332 ierr = PCBDDCScalingReset_Deluxe_Solvers(pcbddc->deluxe_ctx);CHKERRQ(ierr); 333 ierr = PCBDDCSubSchursDestroy(&(pcbddc->deluxe_ctx->sub_schurs));CHKERRQ(ierr); 334 ierr = PetscFree(pcbddc->deluxe_ctx);CHKERRQ(ierr); 335 PetscFunctionReturn(0); 336 } 337 338 #undef __FUNCT__ 339 #define __FUNCT__ "PCBDDCScalingReset_Deluxe_Solvers" 340 static PetscErrorCode PCBDDCScalingReset_Deluxe_Solvers(PCBDDCDeluxeScaling deluxe_ctx) 341 { 342 PetscErrorCode ierr; 343 344 PetscFunctionBegin; 345 ierr = PetscFree(deluxe_ctx->idx_simple_B);CHKERRQ(ierr); 346 deluxe_ctx->n_simple = 0; 347 if (deluxe_ctx->seq_mat) { 348 ierr = VecScatterDestroy(&deluxe_ctx->seq_scctx);CHKERRQ(ierr); 349 ierr = VecDestroy(&deluxe_ctx->seq_work1);CHKERRQ(ierr); 350 ierr = VecDestroy(&deluxe_ctx->seq_work2);CHKERRQ(ierr); 351 ierr = MatDestroy(&deluxe_ctx->seq_mat);CHKERRQ(ierr); 352 ierr = KSPDestroy(&deluxe_ctx->seq_ksp);CHKERRQ(ierr); 353 } 354 if (deluxe_ctx->par_colors) { 355 PetscInt i; 356 for (i=0;i<deluxe_ctx->par_colors;i++) { 357 ierr = VecScatterDestroy(&deluxe_ctx->par_scctx_s[i]);CHKERRQ(ierr); 358 ierr = VecScatterDestroy(&deluxe_ctx->par_scctx_p[i]);CHKERRQ(ierr); 359 ierr = VecDestroy(&deluxe_ctx->par_vec[i]);CHKERRQ(ierr); 360 ierr = KSPDestroy(&deluxe_ctx->par_ksp[i]);CHKERRQ(ierr); 361 } 362 ierr = PetscFree5(deluxe_ctx->par_ksp, 363 deluxe_ctx->par_scctx_s, 364 deluxe_ctx->par_scctx_p, 365 deluxe_ctx->par_vec, 366 deluxe_ctx->par_col2sub);CHKERRQ(ierr); 367 } 368 deluxe_ctx->par_colors = 0; 369 PetscFunctionReturn(0); 370 } 371 372 #undef __FUNCT__ 373 #define __FUNCT__ "PCBDDCScalingSetUp_Deluxe" 374 static PetscErrorCode PCBDDCScalingSetUp_Deluxe(PC pc) 375 { 376 PC_IS *pcis=(PC_IS*)pc->data; 377 PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 378 PCBDDCDeluxeScaling deluxe_ctx=pcbddc->deluxe_ctx; 379 PCBDDCSubSchurs sub_schurs=deluxe_ctx->sub_schurs; 380 PCBDDCGraph graph; 381 IS *faces,*edges,*all_cc; 382 PetscBT bitmask; 383 PetscInt *index_sequential,*index_parallel; 384 PetscInt *auxlocal_sequential,*auxlocal_parallel; 385 PetscInt *auxglobal_sequential,*auxglobal_parallel; 386 PetscInt *auxmapping,*idxs; 387 PetscInt i,max_subset_size; 388 PetscInt n_sequential_problems,n_local_sequential_problems,n_parallel_problems,n_local_parallel_problems; 389 PetscInt n_faces,n_edges,n_all_cc; 390 PetscErrorCode ierr; 391 392 PetscFunctionBegin; 393 /* throw away the solvers */ 394 ierr = PCBDDCScalingReset_Deluxe_Solvers(deluxe_ctx);CHKERRQ(ierr); 395 396 /* attach interface graph for determining subsets */ 397 if (pcbddc->deluxe_rebuild) { /* in case rebuild has been requested, it uses a graph generated only by the neighbouring information */ 398 PetscInt *idx_V_N; 399 IS verticesIS; 400 ierr = PCBDDCGetPrimalVerticesLocalIdx(pc,&i,&idx_V_N);CHKERRQ(ierr); 401 ierr = ISCreateGeneral(PETSC_COMM_SELF,i,idx_V_N,PETSC_OWN_POINTER,&verticesIS);CHKERRQ(ierr); 402 ierr = PCBDDCGraphCreate(&graph);CHKERRQ(ierr); 403 ierr = PCBDDCGraphInit(graph,pcbddc->mat_graph->l2gmap);CHKERRQ(ierr); 404 ierr = PCBDDCGraphSetUp(graph,0,NULL,pcbddc->DirichletBoundariesLocal,0,NULL,verticesIS);CHKERRQ(ierr); 405 ierr = PCBDDCGraphComputeConnectedComponents(graph);CHKERRQ(ierr); 406 ierr = ISDestroy(&verticesIS);CHKERRQ(ierr); 407 /* 408 if (pcbddc->dbg_flag) { 409 ierr = PCBDDCGraphASCIIView(graph,pcbddc->dbg_flag,pcbddc->dbg_viewer);CHKERRQ(ierr); 410 } 411 */ 412 } else { 413 graph = pcbddc->mat_graph; 414 } 415 416 /* get index sets for faces and edges */ 417 ierr = PCBDDCGraphGetCandidatesIS(graph,&n_faces,&faces,&n_edges,&edges,NULL);CHKERRQ(ierr); 418 n_all_cc = n_faces+n_edges; 419 ierr = PetscMalloc1(n_all_cc,&all_cc);CHKERRQ(ierr); 420 for (i=0;i<n_faces;i++) { 421 all_cc[i] = faces[i]; 422 } 423 for (i=0;i<n_edges;i++) { 424 all_cc[n_faces+i] = edges[i]; 425 } 426 ierr = PetscFree(faces);CHKERRQ(ierr); 427 ierr = PetscFree(edges);CHKERRQ(ierr); 428 429 /* map interface's subsets */ 430 max_subset_size = 0; 431 for (i=0;i<n_all_cc;i++) { 432 PetscInt subset_size; 433 ierr = ISGetLocalSize(all_cc[i],&subset_size);CHKERRQ(ierr); 434 max_subset_size = PetscMax(max_subset_size,subset_size); 435 } 436 ierr = PetscMalloc5(max_subset_size,&auxmapping, 437 graph->ncc,&auxlocal_sequential, 438 graph->ncc,&auxlocal_parallel, 439 graph->ncc,&index_sequential, 440 graph->ncc,&index_parallel);CHKERRQ(ierr); 441 442 /* if threshold is negative, uses all sequential problems */ 443 if (pcbddc->deluxe_threshold < 0) pcbddc->deluxe_threshold = max_subset_size; 444 445 /* workspace */ 446 ierr = PetscBTCreate(pcis->n,&bitmask);CHKERRQ(ierr); 447 ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&idxs);CHKERRQ(ierr); 448 for (i=0;i<pcis->n-pcis->n_B;i++) { 449 ierr = PetscBTSet(bitmask,idxs[i]);CHKERRQ(ierr); 450 } 451 ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&idxs);CHKERRQ(ierr); 452 453 /* determine which problem has to be solved in parallel or sequentially */ 454 n_local_sequential_problems = 0; 455 n_local_parallel_problems = 0; 456 for (i=0;i<n_all_cc;i++) { 457 PetscInt subset_size,j,min_loc = 0; 458 459 ierr = ISGetLocalSize(all_cc[i],&subset_size);CHKERRQ(ierr); 460 ierr = ISGetIndices(all_cc[i],(const PetscInt**)&idxs);CHKERRQ(ierr); 461 for (j=0;j<subset_size;j++) { 462 ierr = PetscBTSet(bitmask,idxs[j]);CHKERRQ(ierr); 463 } 464 ierr = ISLocalToGlobalMappingApply(graph->l2gmap,subset_size,idxs,auxmapping);CHKERRQ(ierr); 465 for (j=1;j<subset_size;j++) { 466 if (auxmapping[j]<auxmapping[min_loc]) { 467 min_loc = j; 468 } 469 } 470 if (subset_size > pcbddc->deluxe_threshold) { 471 index_parallel[n_local_parallel_problems] = i; 472 auxlocal_parallel[n_local_parallel_problems] = idxs[min_loc]; 473 n_local_parallel_problems++; 474 } else { 475 index_sequential[n_local_sequential_problems] = i; 476 auxlocal_sequential[n_local_sequential_problems] = idxs[min_loc]; 477 n_local_sequential_problems++; 478 } 479 ierr = ISRestoreIndices(all_cc[i],(const PetscInt**)&idxs);CHKERRQ(ierr); 480 } 481 482 /* diagonal scaling on interface dofs not contained in cc */ 483 deluxe_ctx->n_simple = 0; 484 for (i=0;i<pcis->n;i++) { 485 if (!PetscBTLookup(bitmask,i)) { 486 deluxe_ctx->n_simple++; 487 } 488 } 489 ierr = PetscMalloc1(deluxe_ctx->n_simple,&deluxe_ctx->idx_simple_B);CHKERRQ(ierr); 490 deluxe_ctx->n_simple = 0; 491 for (i=0;i<pcis->n;i++) { 492 if (!PetscBTLookup(bitmask,i)) { 493 deluxe_ctx->idx_simple_B[deluxe_ctx->n_simple++] = i; 494 } 495 } 496 ierr = ISGlobalToLocalMappingApply(pcbddc->BtoNmap,IS_GTOLM_DROP,deluxe_ctx->n_simple,deluxe_ctx->idx_simple_B,&i,deluxe_ctx->idx_simple_B);CHKERRQ(ierr); 497 if (i != deluxe_ctx->n_simple) { 498 SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error when mapping simple scaling dofs! %d != %d",i,deluxe_ctx->n_simple); 499 } 500 ierr = PetscBTDestroy(&bitmask);CHKERRQ(ierr); 501 502 /* SetUp local schur complements on subsets TODO better reuse procedure */ 503 if (!sub_schurs->n_subs) { 504 Mat S_j; 505 PetscBool free_used_adj; 506 PetscInt *used_xadj,*used_adjncy; 507 508 /* decide the adjacency to be used for determining internal problems for local schur on subsets */ 509 free_used_adj = PETSC_FALSE; 510 if (pcbddc->deluxe_layers == -1) { 511 used_xadj = NULL; 512 used_adjncy = NULL; 513 } else { 514 if ((pcbddc->deluxe_use_useradj && pcbddc->mat_graph->xadj) || !pcbddc->deluxe_compute_rowadj) { 515 used_xadj = pcbddc->mat_graph->xadj; 516 used_adjncy = pcbddc->mat_graph->adjncy; 517 } else { 518 Mat mat_adj; 519 PetscBool flg_row=PETSC_TRUE; 520 const PetscInt *xadj,*adjncy; 521 PetscInt nvtxs; 522 523 ierr = MatConvert(pcbddc->local_mat,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr); 524 ierr = MatGetRowIJ(mat_adj,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 525 if (!flg_row) { 526 SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__); 527 } 528 ierr = PetscMalloc2(nvtxs+1,&used_xadj,xadj[nvtxs],&used_adjncy);CHKERRQ(ierr); 529 ierr = PetscMemcpy(used_xadj,xadj,(nvtxs+1)*sizeof(*xadj));CHKERRQ(ierr); 530 ierr = PetscMemcpy(used_adjncy,adjncy,(xadj[nvtxs])*sizeof(*adjncy));CHKERRQ(ierr); 531 ierr = MatRestoreRowIJ(mat_adj,0,PETSC_TRUE,PETSC_FALSE,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 532 if (!flg_row) { 533 SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in %s\n",__FUNCT__); 534 } 535 ierr = MatDestroy(&mat_adj);CHKERRQ(ierr); 536 free_used_adj = PETSC_TRUE; 537 } 538 } 539 540 /* Create Schur complement matrix */ 541 ierr = MatCreateSchurComplement(pcis->A_II,pcis->A_II,pcis->A_IB,pcis->A_BI,pcis->A_BB,&S_j);CHKERRQ(ierr); 542 ierr = MatSchurComplementSetKSP(S_j,pcbddc->ksp_D);CHKERRQ(ierr); 543 544 /* setup Schur complements on subsets */ 545 ierr = PCBDDCSubSchursSetUp(sub_schurs,S_j,pcis->is_I_local,pcis->is_B_local,n_all_cc,all_cc,used_xadj,used_adjncy,pcbddc->deluxe_layers);CHKERRQ(ierr); 546 ierr = MatDestroy(&S_j);CHKERRQ(ierr); 547 /* free adjacency */ 548 if (free_used_adj) { 549 ierr = PetscFree2(used_xadj,used_adjncy);CHKERRQ(ierr); 550 } 551 } 552 for (i=0;i<n_all_cc;i++) { 553 ierr = ISDestroy(&all_cc[i]);CHKERRQ(ierr); 554 } 555 ierr = PetscFree(all_cc);CHKERRQ(ierr); 556 557 /* Number parallel problems */ 558 auxglobal_parallel = 0; 559 ierr = PCBDDCSubsetNumbering(PetscObjectComm((PetscObject)pc),graph->l2gmap,n_local_parallel_problems,auxlocal_parallel,PETSC_NULL,&n_parallel_problems,&auxglobal_parallel);CHKERRQ(ierr); 560 if (pcbddc->dbg_flag) { 561 ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Deluxe global number of parallel subproblems: %d\n",n_parallel_problems); 562 } 563 564 /* Compute data structures to solve parallel problems */ 565 ierr = PCBDDCScalingSetUp_Deluxe_Par(pc,n_local_parallel_problems,n_parallel_problems,auxglobal_parallel,index_parallel);CHKERRQ(ierr); 566 ierr = PetscFree(auxglobal_parallel);CHKERRQ(ierr); 567 568 569 /* Number sequential problems */ 570 auxglobal_sequential = 0; 571 ierr = PCBDDCSubsetNumbering(PetscObjectComm((PetscObject)pc),graph->l2gmap,n_local_sequential_problems,auxlocal_sequential,PETSC_NULL,&n_sequential_problems,&auxglobal_sequential);CHKERRQ(ierr); 572 if (pcbddc->dbg_flag) { 573 ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Deluxe global number of sequential subproblems: %d\n",n_sequential_problems); 574 } 575 576 /* Compute data structures to solve sequential problems */ 577 ierr = PCBDDCScalingSetUp_Deluxe_Seq(pc,n_local_sequential_problems,n_sequential_problems,auxglobal_sequential,index_sequential);CHKERRQ(ierr); 578 ierr = PetscFree(auxglobal_sequential);CHKERRQ(ierr); 579 580 /* free workspace */ 581 ierr = PetscFree5(auxmapping,auxlocal_sequential,auxlocal_parallel,index_sequential,index_parallel);CHKERRQ(ierr); 582 583 /* free graph struct */ 584 if (pcbddc->deluxe_rebuild) { 585 ierr = PCBDDCGraphDestroy(&graph);CHKERRQ(ierr); 586 } 587 PetscFunctionReturn(0); 588 } 589 590 #undef __FUNCT__ 591 #define __FUNCT__ "PCBDDCScalingSetUp_Deluxe_Par" 592 static PetscErrorCode PCBDDCScalingSetUp_Deluxe_Par(PC pc, PetscInt n_local_parallel_problems,PetscInt n_parallel_problems,PetscInt global_parallel[],PetscInt index_parallel[]) 593 { 594 PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 595 PCBDDCDeluxeScaling deluxe_ctx=pcbddc->deluxe_ctx; 596 /* coloring */ 597 Mat parallel_problems; 598 MatColoring coloring_obj; 599 ISColoring coloring_parallel_problems; 600 IS *par_is_colors,*is_colors; 601 /* working stuff */ 602 PetscInt i,j; 603 PetscErrorCode ierr; 604 605 PetscFunctionBegin; 606 if (!n_parallel_problems) { 607 PetscFunctionReturn(0); 608 } 609 /* Color parallel subproblems */ 610 ierr = MatCreate(PetscObjectComm((PetscObject)pc),¶llel_problems);CHKERRQ(ierr); 611 ierr = MatSetSizes(parallel_problems,PETSC_DECIDE,PETSC_DECIDE,n_parallel_problems,n_parallel_problems);CHKERRQ(ierr); 612 ierr = MatSetType(parallel_problems,MATAIJ);CHKERRQ(ierr); 613 ierr = MatSetUp(parallel_problems);CHKERRQ(ierr); 614 ierr = MatSetOption(parallel_problems,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 615 ierr = MatSetOption(parallel_problems,MAT_NEW_NONZERO_ALLOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 616 for (i=0;i<n_local_parallel_problems;i++) { 617 PetscInt row = global_parallel[i]; 618 for (j=0;j<n_local_parallel_problems;j++) { 619 PetscInt col = global_parallel[j]; 620 if (row != col) { 621 ierr = MatSetValue(parallel_problems,row,col,1.0,INSERT_VALUES);CHKERRQ(ierr); 622 } 623 } 624 } 625 ierr = MatAssemblyBegin(parallel_problems,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 626 ierr = MatAssemblyEnd(parallel_problems,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 627 if (pcbddc->dbg_flag > 1) { 628 ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 629 ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Adj matrix for deluxe parallel problems\n");CHKERRQ(ierr); 630 ierr = MatView(parallel_problems,pcbddc->dbg_viewer);CHKERRQ(ierr); 631 } 632 ierr = MatColoringCreate(parallel_problems,&coloring_obj);CHKERRQ(ierr); 633 ierr = MatColoringSetDistance(coloring_obj,1);CHKERRQ(ierr); 634 ierr = MatColoringSetType(coloring_obj,MATCOLORINGJP);CHKERRQ(ierr); 635 ierr = MatColoringApply(coloring_obj,&coloring_parallel_problems);CHKERRQ(ierr); 636 ierr = ISColoringGetIS(coloring_parallel_problems,&deluxe_ctx->par_colors,&par_is_colors);CHKERRQ(ierr); 637 if (pcbddc->dbg_flag) { 638 ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 639 ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Number of colors %d for parallel part of deluxe\n",deluxe_ctx->par_colors);CHKERRQ(ierr); 640 } 641 642 /* all procs should know the color distribution */ 643 ierr = PetscMalloc1(deluxe_ctx->par_colors,&is_colors);CHKERRQ(ierr); 644 for (i=0;i<deluxe_ctx->par_colors;i++) { 645 if (pcbddc->dbg_flag) { 646 ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Global problem indexes for color %d\n",i);CHKERRQ(ierr); 647 ierr = ISView(par_is_colors[i],pcbddc->dbg_viewer);CHKERRQ(ierr); 648 ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 649 } 650 ierr = ISAllGather(par_is_colors[i],&is_colors[i]);CHKERRQ(ierr); 651 } 652 653 /* free unneeded objects */ 654 ierr = ISColoringRestoreIS(coloring_parallel_problems,&par_is_colors);CHKERRQ(ierr); 655 ierr = ISColoringDestroy(&coloring_parallel_problems);CHKERRQ(ierr); 656 ierr = MatColoringDestroy(&coloring_obj);CHKERRQ(ierr); 657 ierr = MatDestroy(¶llel_problems);CHKERRQ(ierr); 658 659 /* allocate deluxe arrays for parallel problems */ 660 ierr = PetscMalloc5(deluxe_ctx->par_colors,&deluxe_ctx->par_ksp, 661 deluxe_ctx->par_colors,&deluxe_ctx->par_scctx_s, 662 deluxe_ctx->par_colors,&deluxe_ctx->par_scctx_p, 663 deluxe_ctx->par_colors,&deluxe_ctx->par_vec, 664 deluxe_ctx->par_colors,&deluxe_ctx->par_col2sub);CHKERRQ(ierr); 665 666 /* cycle on colors */ 667 for (i=0;i<deluxe_ctx->par_colors;i++) { 668 PetscSubcomm par_subcomm; 669 const PetscInt* idxs_subproblems; 670 PetscInt color_size; 671 PetscMPIInt rank,active_color; 672 673 /* get local index of i-th parallel colored problem */ 674 ierr = ISGetLocalSize(is_colors[i],&color_size);CHKERRQ(ierr); 675 ierr = ISGetIndices(is_colors[i],&idxs_subproblems);CHKERRQ(ierr); 676 /* split comm for computing parallel problems for this color */ 677 /* Processes not partecipating at this stage will have color = color_size */ 678 /* because PetscCommDuplicate does not handle MPI_COMM_NULL */ 679 active_color = color_size; 680 deluxe_ctx->par_col2sub[i] = -1; 681 for (j=0;j<n_local_parallel_problems;j++) { 682 PetscInt local_idx; 683 ierr = PetscFindInt(global_parallel[j],color_size,idxs_subproblems,&local_idx);CHKERRQ(ierr); 684 if (local_idx > -1) { 685 ierr = PetscMPIIntCast(local_idx,&active_color);CHKERRQ(ierr); 686 deluxe_ctx->par_col2sub[i] = index_parallel[j]; 687 break; 688 } 689 } 690 ierr = ISRestoreIndices(is_colors[i],&idxs_subproblems);CHKERRQ(ierr); 691 ierr = PetscSubcommCreate(PetscObjectComm((PetscObject)pc),&par_subcomm);CHKERRQ(ierr); 692 ierr = PetscSubcommSetNumber(par_subcomm,color_size+1);CHKERRQ(ierr); 693 ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)pc),&rank);CHKERRQ(ierr); 694 ierr = PetscSubcommSetTypeGeneral(par_subcomm,active_color,rank);CHKERRQ(ierr); 695 /* print debug info */ 696 if (pcbddc->dbg_flag) { 697 PetscMPIInt crank,csize; 698 ierr = MPI_Comm_rank(par_subcomm->comm,&crank);CHKERRQ(ierr); 699 ierr = MPI_Comm_size(par_subcomm->comm,&csize);CHKERRQ(ierr); 700 ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Color %d: size %d, details follows.\n",i,color_size);CHKERRQ(ierr); 701 ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 702 ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr); 703 ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer," Subdomain %d: color in subcomm %d (rank %d out of %d) (lidx %d)\n",PetscGlobalRank,par_subcomm->color,crank,csize,deluxe_ctx->par_col2sub[i]);CHKERRQ(ierr); 704 ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 705 } 706 707 if (deluxe_ctx->par_col2sub[i] >= 0) { 708 PC pc; 709 Mat color_mat,color_mat_is,temp_mat; 710 ISLocalToGlobalMapping WtoNmap,l2gmap_subset; 711 IS is_local_numbering,isB_local,isW_local,isW; 712 PCBDDCSubSchurs sub_schurs = deluxe_ctx->sub_schurs; 713 PetscInt subidx,n_local_dofs,n_global_dofs; 714 PetscInt *global_numbering,*local_numbering; 715 char ksp_prefix[256]; 716 size_t len; 717 718 /* Local index for schur complement on subset */ 719 subidx = deluxe_ctx->par_col2sub[i]; 720 721 /* Parallel numbering for dofs in colored subset */ 722 ierr = ISSum(sub_schurs->is_AEj_I[subidx],sub_schurs->is_AEj_B[subidx],&is_local_numbering);CHKERRQ(ierr); 723 ierr = ISGetLocalSize(is_local_numbering,&n_local_dofs);CHKERRQ(ierr); 724 ierr = ISGetIndices(is_local_numbering,(const PetscInt **)&local_numbering);CHKERRQ(ierr); 725 ierr = PCBDDCSubsetNumbering(par_subcomm->comm,pcbddc->mat_graph->l2gmap,n_local_dofs,local_numbering,PETSC_NULL,&n_global_dofs,&global_numbering);CHKERRQ(ierr); 726 ierr = ISRestoreIndices(is_local_numbering,(const PetscInt **)&local_numbering);CHKERRQ(ierr); 727 728 /* L2Gmap from relevant dofs to local dofs */ 729 ierr = ISLocalToGlobalMappingCreateIS(is_local_numbering,&WtoNmap);CHKERRQ(ierr); 730 731 /* L2Gmap from local to global dofs */ 732 ierr = ISLocalToGlobalMappingCreate(par_subcomm->comm,1,n_local_dofs,global_numbering,PETSC_COPY_VALUES,&l2gmap_subset);CHKERRQ(ierr); 733 734 /* compute parallel matrix (extended dirichlet problem on subset) */ 735 ierr = MatCreateIS(par_subcomm->comm,1,PETSC_DECIDE,PETSC_DECIDE,n_global_dofs,n_global_dofs,l2gmap_subset,&color_mat_is);CHKERRQ(ierr); 736 ierr = MatGetSubMatrix(pcbddc->local_mat,is_local_numbering,is_local_numbering,MAT_INITIAL_MATRIX,&temp_mat);CHKERRQ(ierr); 737 ierr = MatISSetLocalMat(color_mat_is,temp_mat);CHKERRQ(ierr); 738 ierr = MatDestroy(&temp_mat);CHKERRQ(ierr); 739 ierr = MatISGetMPIXAIJ(color_mat_is,MAT_INITIAL_MATRIX,&color_mat);CHKERRQ(ierr); 740 ierr = MatDestroy(&color_mat_is);CHKERRQ(ierr); 741 742 /* work vector for (parallel) extended dirichlet problem */ 743 ierr = MatCreateVecs(color_mat,&deluxe_ctx->par_vec[i],NULL);CHKERRQ(ierr); 744 745 /* compute scatters */ 746 /* deluxe_ctx->par_scctx_p[i] extension from local subset to extended dirichlet problem 747 deluxe_ctx->par_scctx_s[i] restriction from local boundary to subset -> simple copy of selected values */ 748 ierr = ISGlobalToLocalMappingApplyIS(pcbddc->BtoNmap,IS_GTOLM_DROP,sub_schurs->is_AEj_B[subidx],&isB_local);CHKERRQ(ierr); 749 ierr = VecScatterCreate(pcbddc->work_scaling,isB_local,sub_schurs->work1[subidx],NULL,&deluxe_ctx->par_scctx_s[i]);CHKERRQ(ierr); 750 ierr = ISGlobalToLocalMappingApplyIS(WtoNmap,IS_GTOLM_DROP,sub_schurs->is_AEj_B[subidx],&isW_local);CHKERRQ(ierr); 751 ierr = ISLocalToGlobalMappingApplyIS(l2gmap_subset,isW_local,&isW);CHKERRQ(ierr); 752 ierr = VecScatterCreate(sub_schurs->work1[subidx],NULL,deluxe_ctx->par_vec[i],isW,&deluxe_ctx->par_scctx_p[i]);CHKERRQ(ierr); 753 754 /* free objects no longer neeeded */ 755 ierr = ISDestroy(&isW);CHKERRQ(ierr); 756 ierr = ISDestroy(&isW_local);CHKERRQ(ierr); 757 ierr = ISDestroy(&isB_local);CHKERRQ(ierr); 758 ierr = ISLocalToGlobalMappingDestroy(&WtoNmap);CHKERRQ(ierr); 759 ierr = ISLocalToGlobalMappingDestroy(&l2gmap_subset);CHKERRQ(ierr); 760 ierr = ISDestroy(&is_local_numbering);CHKERRQ(ierr); 761 ierr = PetscFree(global_numbering);CHKERRQ(ierr); 762 763 /* KSP for extended dirichlet problem */ 764 ierr = KSPCreate(par_subcomm->comm,&deluxe_ctx->par_ksp[i]);CHKERRQ(ierr); 765 ierr = KSPSetOperators(deluxe_ctx->par_ksp[i],color_mat,color_mat);CHKERRQ(ierr); 766 ierr = KSPSetTolerances(deluxe_ctx->par_ksp[i],1.e-12,1.e-12,1.e10,10000);CHKERRQ(ierr); 767 ierr = KSPSetType(deluxe_ctx->par_ksp[i],KSPPREONLY);CHKERRQ(ierr); 768 ierr = KSPGetPC(deluxe_ctx->par_ksp[i],&pc);CHKERRQ(ierr); 769 ierr = PCSetType(pc,PCREDUNDANT);CHKERRQ(ierr); 770 ierr = PetscStrlen(((PetscObject)(pcbddc->ksp_D))->prefix,&len);CHKERRQ(ierr); 771 len -= 10; /* remove "dirichlet_" */ 772 ierr = PetscStrncpy(ksp_prefix,((PetscObject)(pcbddc->ksp_D))->prefix,len+1);CHKERRQ(ierr); /* PetscStrncpy puts a terminating char at the end */ 773 ierr = PetscStrcat(ksp_prefix,"deluxe_par_");CHKERRQ(ierr); 774 ierr = KSPSetOptionsPrefix(deluxe_ctx->par_ksp[i],ksp_prefix);CHKERRQ(ierr); 775 ierr = KSPSetFromOptions(deluxe_ctx->par_ksp[i]);CHKERRQ(ierr); 776 ierr = KSPSetUp(deluxe_ctx->par_ksp[i]);CHKERRQ(ierr); 777 ierr = MatDestroy(&color_mat);CHKERRQ(ierr); 778 } else { /* not partecipating in color */ 779 deluxe_ctx->par_ksp[i] = 0; 780 deluxe_ctx->par_vec[i] = 0; 781 deluxe_ctx->par_scctx_p[i] = 0; 782 deluxe_ctx->par_scctx_s[i] = 0; 783 } 784 ierr = PetscSubcommDestroy(&par_subcomm);CHKERRQ(ierr); 785 } 786 for (i=0;i<deluxe_ctx->par_colors;i++) { 787 ierr = ISDestroy(&is_colors[i]);CHKERRQ(ierr); 788 } 789 ierr = PetscFree(is_colors);CHKERRQ(ierr); 790 791 if (pcbddc->dbg_flag) { 792 Vec test_vec; 793 PetscReal error; 794 PCBDDCSubSchurs sub_schurs = deluxe_ctx->sub_schurs; 795 /* test partition of unity of coloured schur complements */ 796 for (i=0;i<deluxe_ctx->par_colors;i++) { 797 PetscInt subidx = deluxe_ctx->par_col2sub[i]; 798 PetscBool error_found = PETSC_FALSE; 799 ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr); 800 801 if (deluxe_ctx->par_ksp[i]) { 802 /* create random test vec being zero on internal nodes of the extende dirichlet problem */ 803 ierr = VecDuplicate(deluxe_ctx->par_vec[i],&test_vec);CHKERRQ(ierr); 804 ierr = VecSetRandom(sub_schurs->work1[subidx],PETSC_NULL);CHKERRQ(ierr); 805 ierr = VecSet(test_vec,0.0);CHKERRQ(ierr); 806 ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],sub_schurs->work1[subidx],test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 807 ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],sub_schurs->work1[subidx],test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 808 /* w_j */ 809 ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],test_vec,sub_schurs->work1[subidx],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 810 ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],test_vec,sub_schurs->work1[subidx],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 811 /* S_j*w_j */ 812 ierr = MatMult(sub_schurs->S_Ej[subidx],sub_schurs->work1[subidx],sub_schurs->work2[subidx]);CHKERRQ(ierr); 813 /* \sum_j S_j*w_j */ 814 ierr = VecSet(deluxe_ctx->par_vec[i],0.0);CHKERRQ(ierr); 815 ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],sub_schurs->work2[subidx],deluxe_ctx->par_vec[i],ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 816 ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],sub_schurs->work2[subidx],deluxe_ctx->par_vec[i],ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 817 /* (\sum_j S_j)^(-1)(\sum_j S_j*w_j) */ 818 ierr = KSPSolve(deluxe_ctx->par_ksp[i],deluxe_ctx->par_vec[i],deluxe_ctx->par_vec[i]);CHKERRQ(ierr); 819 ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_vec[i],sub_schurs->work1[subidx],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 820 ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],deluxe_ctx->par_vec[i],sub_schurs->work1[subidx],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 821 ierr = VecSet(deluxe_ctx->par_vec[i],0.0);CHKERRQ(ierr); 822 ierr = VecScatterBegin(deluxe_ctx->par_scctx_p[i],sub_schurs->work1[subidx],deluxe_ctx->par_vec[i],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 823 ierr = VecScatterEnd(deluxe_ctx->par_scctx_p[i],sub_schurs->work1[subidx],deluxe_ctx->par_vec[i],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 824 /* test partition of unity */ 825 ierr = VecAXPY(test_vec,-1.0,deluxe_ctx->par_vec[i]);CHKERRQ(ierr); 826 ierr = VecNorm(test_vec,NORM_INFINITY,&error);CHKERRQ(ierr); 827 if (PetscAbsReal(error) > 1.e-2) { 828 /* ierr = VecView(test_vec,0);CHKERRQ(ierr); */ 829 error_found = PETSC_TRUE; 830 } 831 ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 832 } 833 if (error_found) { 834 ierr = PetscViewerASCIISynchronizedPrintf(pcbddc->dbg_viewer,"Error testing local schur for color %d and subdomain %d\n",i,PetscGlobalRank);CHKERRQ(ierr); 835 } 836 ierr = PetscViewerFlush(pcbddc->dbg_viewer);CHKERRQ(ierr); 837 } 838 } 839 PetscFunctionReturn(0); 840 } 841 842 843 #undef __FUNCT__ 844 #define __FUNCT__ "PCBDDCScalingSetUp_Deluxe_Seq" 845 static PetscErrorCode PCBDDCScalingSetUp_Deluxe_Seq(PC pc,PetscInt n_local_sequential_problems,PetscInt n_sequential_problems,PetscInt global_sequential[],PetscInt local_sequential[]) 846 { 847 PC_BDDC *pcbddc=(PC_BDDC*)pc->data; 848 PCBDDCDeluxeScaling deluxe_ctx=pcbddc->deluxe_ctx; 849 PCBDDCSubSchurs sub_schurs = deluxe_ctx->sub_schurs; 850 Mat global_schur_subsets,*submat_global_schur_subsets,work_mat; 851 IS is_to,is_from; 852 PetscScalar *array,*fill_vals; 853 PetscInt *all_local_idx_G,*all_local_idx_B,*all_local_idx_N,*all_permutation_G,*dummy_idx; 854 PetscInt i,j,k,local_problem_index; 855 PetscInt subset_size,max_subset_size,max_subset_size_red; 856 PetscInt local_size,global_size; 857 PC pc_temp; 858 MatSolverPackage solver=NULL; 859 char ksp_prefix[256]; 860 size_t len; 861 PetscErrorCode ierr; 862 863 PetscFunctionBegin; 864 if (!n_sequential_problems) { 865 PetscFunctionReturn(0); 866 } 867 /* Get info on subset sizes and sum of all subsets sizes */ 868 max_subset_size = 0; 869 local_size = 0; 870 for (i=0;i<n_local_sequential_problems;i++) { 871 local_problem_index = local_sequential[i]; 872 ierr = ISGetLocalSize(sub_schurs->is_AEj_B[local_problem_index],&subset_size);CHKERRQ(ierr); 873 max_subset_size = PetscMax(subset_size,max_subset_size); 874 local_size += subset_size; 875 } 876 877 /* Work arrays for local indices */ 878 ierr = PetscMalloc1(local_size,&all_local_idx_B);CHKERRQ(ierr); 879 ierr = PetscMalloc1(local_size,&all_local_idx_N);CHKERRQ(ierr); 880 881 /* Get local indices in local whole numbering and local boundary numbering */ 882 local_size = 0; 883 for (i=0;i<n_local_sequential_problems;i++) { 884 PetscInt *idxs; 885 /* get info on local problem */ 886 local_problem_index = local_sequential[i]; 887 ierr = ISGetLocalSize(sub_schurs->is_AEj_B[local_problem_index],&subset_size);CHKERRQ(ierr); 888 ierr = ISGetIndices(sub_schurs->is_AEj_B[local_problem_index],(const PetscInt**)&idxs);CHKERRQ(ierr); 889 /* subset indices in local numbering */ 890 ierr = PetscMemcpy(all_local_idx_N+local_size,idxs,subset_size*sizeof(PetscInt));CHKERRQ(ierr); 891 /* subset indices in local boundary numbering */ 892 ierr = ISGlobalToLocalMappingApply(pcbddc->BtoNmap,IS_GTOLM_DROP,subset_size,idxs,&j,&all_local_idx_B[local_size]);CHKERRQ(ierr); 893 ierr = ISRestoreIndices(sub_schurs->is_AEj_B[local_problem_index],(const PetscInt**)&idxs);CHKERRQ(ierr); 894 if (j != subset_size) { 895 SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in BDDC deluxe serial %d (BtoNmap)! %d != %d\n",local_problem_index,subset_size,j); 896 } 897 local_size += subset_size; 898 } 899 900 /* Number dofs on all subsets (parallel) and sort numbering */ 901 ierr = PCBDDCSubsetNumbering(PetscObjectComm((PetscObject)pc),pcbddc->mat_graph->l2gmap,local_size,all_local_idx_N,PETSC_NULL,&global_size,&all_local_idx_G);CHKERRQ(ierr); 902 ierr = PetscMalloc1(local_size,&all_permutation_G);CHKERRQ(ierr); 903 for (i=0;i<local_size;i++) { 904 all_permutation_G[i]=i; 905 } 906 ierr = PetscSortIntWithPermutation(local_size,all_local_idx_G,all_permutation_G);CHKERRQ(ierr); 907 908 /* Local matrix of all local Schur on subsets */ 909 ierr = MatCreate(PETSC_COMM_SELF,&deluxe_ctx->seq_mat);CHKERRQ(ierr); 910 ierr = MatSetSizes(deluxe_ctx->seq_mat,PETSC_DECIDE,PETSC_DECIDE,local_size,local_size);CHKERRQ(ierr); 911 ierr = MatSetType(deluxe_ctx->seq_mat,MATAIJ);CHKERRQ(ierr); 912 ierr = MatSeqAIJSetPreallocation(deluxe_ctx->seq_mat,max_subset_size,PETSC_NULL);CHKERRQ(ierr); 913 914 /* Global matrix of all assembled Schur on subsets */ 915 ierr = MatCreate(PetscObjectComm((PetscObject)pc),&global_schur_subsets);CHKERRQ(ierr); 916 ierr = MatSetSizes(global_schur_subsets,PETSC_DECIDE,PETSC_DECIDE,global_size,global_size);CHKERRQ(ierr); 917 ierr = MatSetType(global_schur_subsets,MATAIJ);CHKERRQ(ierr); 918 ierr = MPI_Allreduce(&max_subset_size,&max_subset_size_red,1,MPIU_INT,MPI_MAX,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr); 919 ierr = MatMPIAIJSetPreallocation(global_schur_subsets,max_subset_size_red,PETSC_NULL,max_subset_size_red,PETSC_NULL);CHKERRQ(ierr); 920 921 /* Work arrays */ 922 ierr = PetscMalloc2(max_subset_size,&dummy_idx,max_subset_size*max_subset_size,&fill_vals);CHKERRQ(ierr); 923 924 /* Loop on local problems to compute Schur complements explicitly */ 925 local_size = 0; 926 for (i=0;i<n_local_sequential_problems;i++) { 927 /* get info on local problem */ 928 local_problem_index = local_sequential[i]; 929 ierr = ISGetLocalSize(sub_schurs->is_AEj_B[local_problem_index],&subset_size);CHKERRQ(ierr); 930 /* local Schur */ 931 for (j=0;j<subset_size;j++) { 932 ierr = VecSet(sub_schurs->work1[local_problem_index],0.0);CHKERRQ(ierr); 933 ierr = VecSetValue(sub_schurs->work1[local_problem_index],j,1.0,INSERT_VALUES);CHKERRQ(ierr); 934 ierr = MatMult(sub_schurs->S_Ej[local_problem_index],sub_schurs->work1[local_problem_index],sub_schurs->work2[local_problem_index]);CHKERRQ(ierr); 935 /* store vals */ 936 ierr = VecGetArray(sub_schurs->work2[local_problem_index],&array);CHKERRQ(ierr); 937 for (k=0;k<subset_size;k++) { 938 fill_vals[k*subset_size+j] = array[k]; 939 } 940 ierr = VecRestoreArray(sub_schurs->work2[local_problem_index],&array);CHKERRQ(ierr); 941 } 942 for (j=0;j<subset_size;j++) { 943 dummy_idx[j]=local_size+j; 944 } 945 ierr = MatSetValues(deluxe_ctx->seq_mat,subset_size,dummy_idx,subset_size,dummy_idx,fill_vals,INSERT_VALUES);CHKERRQ(ierr); 946 ierr = MatSetValues(global_schur_subsets,subset_size,&all_local_idx_G[local_size],subset_size,&all_local_idx_G[local_size],fill_vals,ADD_VALUES);CHKERRQ(ierr); 947 local_size += subset_size; 948 } 949 ierr = MatAssemblyBegin(deluxe_ctx->seq_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 950 ierr = MatAssemblyEnd(deluxe_ctx->seq_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 951 ierr = MatAssemblyBegin(global_schur_subsets,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 952 ierr = MatAssemblyEnd(global_schur_subsets,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 953 ierr = PetscFree2(dummy_idx,fill_vals);CHKERRQ(ierr); 954 955 /* Create work vectors for sequential part of deluxe */ 956 ierr = MatCreateVecs(deluxe_ctx->seq_mat,&deluxe_ctx->seq_work1,&deluxe_ctx->seq_work2);CHKERRQ(ierr); 957 958 /* Compute deluxe sequential scatter */ 959 ierr = ISCreateGeneral(PETSC_COMM_SELF,local_size,all_local_idx_B,PETSC_OWN_POINTER,&is_from);CHKERRQ(ierr); 960 ierr = VecScatterCreate(pcbddc->work_scaling,is_from,deluxe_ctx->seq_work1,NULL,&deluxe_ctx->seq_scctx);CHKERRQ(ierr); 961 ierr = ISDestroy(&is_from);CHKERRQ(ierr); 962 963 /* Get local part of (\sum_j S_Ej) */ 964 for (i=0;i<local_size;i++) { 965 all_local_idx_N[i] = all_local_idx_G[all_permutation_G[i]]; 966 } 967 ierr = ISCreateGeneral(PetscObjectComm((PetscObject)pc),local_size,all_local_idx_N,PETSC_OWN_POINTER,&is_to);CHKERRQ(ierr); 968 ierr = MatGetSubMatrices(global_schur_subsets,1,&is_to,&is_to,MAT_INITIAL_MATRIX,&submat_global_schur_subsets);CHKERRQ(ierr); 969 ierr = MatDestroy(&global_schur_subsets);CHKERRQ(ierr); 970 ierr = ISDestroy(&is_to);CHKERRQ(ierr); 971 for (i=0;i<local_size;i++) { 972 all_local_idx_G[all_permutation_G[i]] = i; 973 } 974 ierr = ISCreateGeneral(PETSC_COMM_SELF,local_size,all_local_idx_G,PETSC_OWN_POINTER,&is_from);CHKERRQ(ierr); 975 ierr = ISSetPermutation(is_from);CHKERRQ(ierr); 976 ierr = MatPermute(submat_global_schur_subsets[0],is_from,is_from,&work_mat);CHKERRQ(ierr); 977 ierr = MatDestroyMatrices(1,&submat_global_schur_subsets);CHKERRQ(ierr); 978 ierr = ISDestroy(&is_from);CHKERRQ(ierr); 979 ierr = PetscFree(all_permutation_G);CHKERRQ(ierr); 980 981 /* Create KSP object for sequential part of deluxe scaling */ 982 ierr = KSPCreate(PETSC_COMM_SELF,&deluxe_ctx->seq_ksp);CHKERRQ(ierr); 983 ierr = KSPSetOperators(deluxe_ctx->seq_ksp,work_mat,work_mat);CHKERRQ(ierr); 984 ierr = KSPSetType(deluxe_ctx->seq_ksp,KSPPREONLY);CHKERRQ(ierr); 985 ierr = KSPGetPC(deluxe_ctx->seq_ksp,&pc_temp);CHKERRQ(ierr); 986 ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 987 ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr); 988 ierr = PCFactorGetMatSolverPackage(pc_temp,(const MatSolverPackage*)&solver);CHKERRQ(ierr); 989 if (solver) { 990 PC new_pc; 991 PCType type; 992 ierr = PCGetType(pc_temp,&type);CHKERRQ(ierr); 993 ierr = KSPGetPC(deluxe_ctx->seq_ksp,&new_pc);CHKERRQ(ierr); 994 ierr = PCSetType(new_pc,type);CHKERRQ(ierr); 995 ierr = PCFactorSetMatSolverPackage(new_pc,solver);CHKERRQ(ierr); 996 } 997 ierr = PetscStrlen(((PetscObject)(pcbddc->ksp_D))->prefix,&len);CHKERRQ(ierr); 998 len -= 10; /* remove "dirichlet_" */ 999 ierr = PetscStrncpy(ksp_prefix,((PetscObject)(pcbddc->ksp_D))->prefix,len+1);CHKERRQ(ierr); 1000 ierr = PetscStrcat(ksp_prefix,"deluxe_seq_");CHKERRQ(ierr); 1001 ierr = KSPSetOptionsPrefix(deluxe_ctx->seq_ksp,ksp_prefix);CHKERRQ(ierr); 1002 ierr = KSPSetFromOptions(deluxe_ctx->seq_ksp);CHKERRQ(ierr); 1003 ierr = KSPSetUp(deluxe_ctx->seq_ksp);CHKERRQ(ierr); 1004 ierr = MatDestroy(&work_mat);CHKERRQ(ierr); 1005 PetscFunctionReturn(0); 1006 } 1007