/* Defines a Eisenstat trick SSOR preconditioner. This uses about %50 of the usual amount of floating point ops used for SSOR + Krylov method. But it requires actually solving the preconditioned problem with both left and right preconditioning. */ #include /*I "petscpc.h" I*/ typedef struct { Mat shell,A; Vec b[2],diag; /* temporary storage for true right hand side */ PetscReal omega; PetscBool usediag; /* indicates preconditioner should include diagonal scaling*/ } PC_Eisenstat; #undef __FUNCT__ #define __FUNCT__ "PCMult_Eisenstat" static PetscErrorCode PCMult_Eisenstat(Mat mat,Vec b,Vec x) { PetscErrorCode ierr; PC pc; PC_Eisenstat *eis; PetscFunctionBegin; ierr = MatShellGetContext(mat,(void**)&pc);CHKERRQ(ierr); eis = (PC_Eisenstat*)pc->data; ierr = MatSOR(eis->A,b,eis->omega,SOR_EISENSTAT,0.0,1,1,x);CHKERRQ(ierr); PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCApply_Eisenstat" static PetscErrorCode PCApply_Eisenstat(PC pc,Vec x,Vec y) { PC_Eisenstat *eis = (PC_Eisenstat*)pc->data; PetscErrorCode ierr; PetscBool hasop; PetscFunctionBegin; if (eis->usediag) { ierr = MatHasOperation(pc->pmat,MATOP_MULT_DIAGONAL_BLOCK,&hasop);CHKERRQ(ierr); if (hasop) { ierr = MatMultDiagonalBlock(pc->pmat,x,y);CHKERRQ(ierr); } else { ierr = VecPointwiseMult(y,x,eis->diag);CHKERRQ(ierr); } } else {ierr = VecCopy(x,y);CHKERRQ(ierr);} PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCPreSolve_Eisenstat" static PetscErrorCode PCPreSolve_Eisenstat(PC pc,KSP ksp,Vec b,Vec x) { PC_Eisenstat *eis = (PC_Eisenstat*)pc->data; PetscBool nonzero; PetscErrorCode ierr; PetscFunctionBegin; if (pc->presolvedone < 2) { if (pc->mat != pc->pmat) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_SUP,"Cannot have different mat and pmat"); /* swap shell matrix and true matrix */ eis->A = pc->mat; pc->mat = eis->shell; } if (!eis->b[pc->presolvedone-1]) { ierr = VecDuplicate(b,&eis->b[pc->presolvedone-1]);CHKERRQ(ierr); ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)eis->b[pc->presolvedone-1]);CHKERRQ(ierr); } /* if nonzero initial guess, modify x */ ierr = KSPGetInitialGuessNonzero(ksp,&nonzero);CHKERRQ(ierr); if (nonzero) { ierr = VecCopy(x,eis->b[pc->presolvedone-1]);CHKERRQ(ierr); ierr = MatSOR(eis->A,eis->b[pc->presolvedone-1],eis->omega,SOR_APPLY_UPPER,0.0,1,1,x);CHKERRQ(ierr); } /* save true b, other option is to swap pointers */ ierr = VecCopy(b,eis->b[pc->presolvedone-1]);CHKERRQ(ierr); /* modify b by (L + D/omega)^{-1} */ ierr = MatSOR(eis->A,eis->b[pc->presolvedone-1],eis->omega,(MatSORType)(SOR_ZERO_INITIAL_GUESS | SOR_LOCAL_FORWARD_SWEEP),0.0,1,1,b);CHKERRQ(ierr); PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCPostSolve_Eisenstat" static PetscErrorCode PCPostSolve_Eisenstat(PC pc,KSP ksp,Vec b,Vec x) { PC_Eisenstat *eis = (PC_Eisenstat*)pc->data; PetscErrorCode ierr; PetscFunctionBegin; /* get back true b */ ierr = VecCopy(eis->b[pc->presolvedone],b);CHKERRQ(ierr); /* modify x by (U + D/omega)^{-1} */ ierr = VecCopy(x,eis->b[pc->presolvedone]);CHKERRQ(ierr); ierr = MatSOR(eis->A,eis->b[pc->presolvedone],eis->omega,(MatSORType)(SOR_ZERO_INITIAL_GUESS | SOR_LOCAL_BACKWARD_SWEEP),0.0,1,1,x);CHKERRQ(ierr); if (!pc->presolvedone) pc->mat = eis->A; PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCReset_Eisenstat" static PetscErrorCode PCReset_Eisenstat(PC pc) { PC_Eisenstat *eis = (PC_Eisenstat*)pc->data; PetscErrorCode ierr; PetscFunctionBegin; ierr = VecDestroy(&eis->b[0]);CHKERRQ(ierr); ierr = VecDestroy(&eis->b[1]);CHKERRQ(ierr); ierr = MatDestroy(&eis->shell);CHKERRQ(ierr); ierr = VecDestroy(&eis->diag);CHKERRQ(ierr); PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCDestroy_Eisenstat" static PetscErrorCode PCDestroy_Eisenstat(PC pc) { PetscErrorCode ierr; PetscFunctionBegin; ierr = PCReset_Eisenstat(pc);CHKERRQ(ierr); ierr = PetscFree(pc->data);CHKERRQ(ierr); PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCSetFromOptions_Eisenstat" static PetscErrorCode PCSetFromOptions_Eisenstat(PetscOptions *PetscOptionsObject,PC pc) { PC_Eisenstat *eis = (PC_Eisenstat*)pc->data; PetscErrorCode ierr; PetscBool set,flg; PetscFunctionBegin; ierr = PetscOptionsHead(PetscOptionsObject,"Eisenstat SSOR options");CHKERRQ(ierr); ierr = PetscOptionsReal("-pc_eisenstat_omega","Relaxation factor 0 < omega < 2","PCEisenstatSetOmega",eis->omega,&eis->omega,NULL);CHKERRQ(ierr); ierr = PetscOptionsBool("-pc_eisenstat_no_diagonal_scaling","Do not use standard diagonal scaling","PCEisenstatSetNoDiagonalScaling",eis->usediag ? PETSC_FALSE : PETSC_TRUE,&flg,&set);CHKERRQ(ierr); if (set) { ierr = PCEisenstatSetNoDiagonalScaling(pc,flg);CHKERRQ(ierr); } ierr = PetscOptionsTail();CHKERRQ(ierr); PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCView_Eisenstat" static PetscErrorCode PCView_Eisenstat(PC pc,PetscViewer viewer) { PC_Eisenstat *eis = (PC_Eisenstat*)pc->data; PetscErrorCode ierr; PetscBool iascii; PetscFunctionBegin; ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); if (iascii) { ierr = PetscViewerASCIIPrintf(viewer,"Eisenstat: omega = %g\n",(double)eis->omega);CHKERRQ(ierr); if (eis->usediag) { ierr = PetscViewerASCIIPrintf(viewer,"Eisenstat: Using diagonal scaling (default)\n");CHKERRQ(ierr); } else { ierr = PetscViewerASCIIPrintf(viewer,"Eisenstat: Not using diagonal scaling\n");CHKERRQ(ierr); } } PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCSetUp_Eisenstat" static PetscErrorCode PCSetUp_Eisenstat(PC pc) { PetscErrorCode ierr; PetscInt M,N,m,n; PC_Eisenstat *eis = (PC_Eisenstat*)pc->data; PetscFunctionBegin; if (!pc->setupcalled) { ierr = MatGetSize(pc->mat,&M,&N);CHKERRQ(ierr); ierr = MatGetLocalSize(pc->mat,&m,&n);CHKERRQ(ierr); ierr = MatCreate(PetscObjectComm((PetscObject)pc),&eis->shell);CHKERRQ(ierr); ierr = MatSetSizes(eis->shell,m,n,M,N);CHKERRQ(ierr); ierr = MatSetType(eis->shell,MATSHELL);CHKERRQ(ierr); ierr = MatSetUp(eis->shell);CHKERRQ(ierr); ierr = MatShellSetContext(eis->shell,(void*)pc);CHKERRQ(ierr); ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)eis->shell);CHKERRQ(ierr); ierr = MatShellSetOperation(eis->shell,MATOP_MULT,(void (*)(void))PCMult_Eisenstat);CHKERRQ(ierr); } if (!eis->usediag) PetscFunctionReturn(0); if (!pc->setupcalled) { ierr = MatCreateVecs(pc->pmat,&eis->diag,0);CHKERRQ(ierr); ierr = PetscLogObjectParent((PetscObject)pc,(PetscObject)eis->diag);CHKERRQ(ierr); } ierr = MatGetDiagonal(pc->pmat,eis->diag);CHKERRQ(ierr); PetscFunctionReturn(0); } /* --------------------------------------------------------------------*/ #undef __FUNCT__ #define __FUNCT__ "PCEisenstatSetOmega_Eisenstat" static PetscErrorCode PCEisenstatSetOmega_Eisenstat(PC pc,PetscReal omega) { PC_Eisenstat *eis = (PC_Eisenstat*)pc->data; PetscFunctionBegin; if (omega >= 2.0 || omega <= 0.0) SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_ARG_OUTOFRANGE,"Relaxation out of range"); eis->omega = omega; PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCEisenstatSetNoDiagonalScaling_Eisenstat" static PetscErrorCode PCEisenstatSetNoDiagonalScaling_Eisenstat(PC pc,PetscBool flg) { PC_Eisenstat *eis = (PC_Eisenstat*)pc->data; PetscFunctionBegin; eis->usediag = flg; PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCEisenstatGetOmega_Eisenstat" static PetscErrorCode PCEisenstatGetOmega_Eisenstat(PC pc,PetscReal *omega) { PC_Eisenstat *eis = (PC_Eisenstat*)pc->data; PetscFunctionBegin; *omega = eis->omega; PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCEisenstatGetNoDiagonalScaling_Eisenstat" static PetscErrorCode PCEisenstatGetNoDiagonalScaling_Eisenstat(PC pc,PetscBool *flg) { PC_Eisenstat *eis = (PC_Eisenstat*)pc->data; PetscFunctionBegin; *flg = eis->usediag; PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCEisenstatSetOmega" /*@ PCEisenstatSetOmega - Sets the SSOR relaxation coefficient, omega, to use with Eisenstat's trick (where omega = 1.0 by default). Logically Collective on PC Input Parameters: + pc - the preconditioner context - omega - relaxation coefficient (0 < omega < 2) Options Database Key: . -pc_eisenstat_omega - Sets omega Notes: The Eisenstat trick implementation of SSOR requires about 50% of the usual amount of floating point operations used for SSOR + Krylov method; however, the preconditioned problem must be solved with both left and right preconditioning. To use SSOR without the Eisenstat trick, employ the PCSOR preconditioner, which can be chosen with the database options $ -pc_type sor -pc_sor_symmetric Level: intermediate .keywords: PC, Eisenstat, set, SOR, SSOR, relaxation, omega .seealso: PCSORSetOmega() @*/ PetscErrorCode PCEisenstatSetOmega(PC pc,PetscReal omega) { PetscErrorCode ierr; PetscFunctionBegin; PetscValidHeaderSpecific(pc,PC_CLASSID,1); PetscValidLogicalCollectiveReal(pc,omega,2); ierr = PetscTryMethod(pc,"PCEisenstatSetOmega_C",(PC,PetscReal),(pc,omega));CHKERRQ(ierr); PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCEisenstatSetNoDiagonalScaling" /*@ PCEisenstatSetNoDiagonalScaling - Causes the Eisenstat preconditioner not to do additional diagonal preconditioning. For matrices with a constant along the diagonal, this may save a small amount of work. Logically Collective on PC Input Parameters: + pc - the preconditioner context - flg - PETSC_TRUE turns off diagonal scaling inside the algorithm Options Database Key: . -pc_eisenstat_no_diagonal_scaling - Activates PCEisenstatSetNoDiagonalScaling() Level: intermediate Note: If you use the KPSSetDiagonalScaling() or -ksp_diagonal_scale option then you will likley want to use this routine since it will save you some unneeded flops. .keywords: PC, Eisenstat, use, diagonal, scaling, SSOR .seealso: PCEisenstatSetOmega() @*/ PetscErrorCode PCEisenstatSetNoDiagonalScaling(PC pc,PetscBool flg) { PetscErrorCode ierr; PetscFunctionBegin; PetscValidHeaderSpecific(pc,PC_CLASSID,1); ierr = PetscTryMethod(pc,"PCEisenstatSetNoDiagonalScaling_C",(PC,PetscBool),(pc,flg));CHKERRQ(ierr); PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCEisenstatGetOmega" /*@ PCEisenstatGetOmega - Gets the SSOR relaxation coefficient, omega, to use with Eisenstat's trick (where omega = 1.0 by default). Logically Collective on PC Input Parameter: . pc - the preconditioner context Output Parameter: . omega - relaxation coefficient (0 < omega < 2) Options Database Key: . -pc_eisenstat_omega - Sets omega Notes: The Eisenstat trick implementation of SSOR requires about 50% of the usual amount of floating point operations used for SSOR + Krylov method; however, the preconditioned problem must be solved with both left and right preconditioning. To use SSOR without the Eisenstat trick, employ the PCSOR preconditioner, which can be chosen with the database options $ -pc_type sor -pc_sor_symmetric Level: intermediate .keywords: PC, Eisenstat, set, SOR, SSOR, relaxation, omega .seealso: PCSORGetOmega(), PCEisenstatSetOmega() @*/ PetscErrorCode PCEisenstatGetOmega(PC pc,PetscReal *omega) { PetscErrorCode ierr; PetscFunctionBegin; PetscValidHeaderSpecific(pc,PC_CLASSID,1); ierr = PetscUseMethod(pc,"PCEisenstatGetOmega_C",(PC,PetscReal*),(pc,omega));CHKERRQ(ierr); PetscFunctionReturn(0); } #undef __FUNCT__ #define __FUNCT__ "PCEisenstatGetNoDiagonalScaling" /*@ PCEisenstatGetNoDiagonalScaling - Causes the Eisenstat preconditioner not to do additional diagonal preconditioning. For matrices with a constant along the diagonal, this may save a small amount of work. Logically Collective on PC Input Parameter: . pc - the preconditioner context Output Parameter: . flg - PETSC_TRUE means there is no diagonal scaling applied Options Database Key: . -pc_eisenstat_no_diagonal_scaling - Activates PCEisenstatSetNoDiagonalScaling() Level: intermediate Note: If you use the KPSSetDiagonalScaling() or -ksp_diagonal_scale option then you will likley want to use this routine since it will save you some unneeded flops. .keywords: PC, Eisenstat, use, diagonal, scaling, SSOR .seealso: PCEisenstatGetOmega() @*/ PetscErrorCode PCEisenstatGetNoDiagonalScaling(PC pc,PetscBool *flg) { PetscErrorCode ierr; PetscFunctionBegin; PetscValidHeaderSpecific(pc,PC_CLASSID,1); ierr = PetscTryMethod(pc,"PCEisenstatGetNoDiagonalScaling_C",(PC,PetscBool*),(pc,flg));CHKERRQ(ierr); PetscFunctionReturn(0); } /* --------------------------------------------------------------------*/ /*MC PCEISENSTAT - An implementation of SSOR (symmetric successive over relaxation, symmetric Gauss-Seidel) preconditioning that incorporates Eisenstat's trick to reduce the amount of computation needed. Options Database Keys: + -pc_eisenstat_omega - Sets omega - -pc_eisenstat_no_diagonal_scaling - Activates PCEisenstatSetNoDiagonalScaling() Level: beginner Concepts: SOR, preconditioners, Gauss-Seidel, Eisenstat's trick Notes: Only implemented for the SeqAIJ matrix format. Not a true parallel SOR, in parallel this implementation corresponds to block Jacobi with SOR on each block. .seealso: PCCreate(), PCSetType(), PCType (for list of available types), PC, PCEisenstatSetNoDiagonalScaling(), PCEisenstatSetOmega(), PCSOR M*/ #undef __FUNCT__ #define __FUNCT__ "PCCreate_Eisenstat" PETSC_EXTERN PetscErrorCode PCCreate_Eisenstat(PC pc) { PetscErrorCode ierr; PC_Eisenstat *eis; PetscFunctionBegin; ierr = PetscNewLog(pc,&eis);CHKERRQ(ierr); pc->ops->apply = PCApply_Eisenstat; pc->ops->presolve = PCPreSolve_Eisenstat; pc->ops->postsolve = PCPostSolve_Eisenstat; pc->ops->applyrichardson = 0; pc->ops->setfromoptions = PCSetFromOptions_Eisenstat; pc->ops->destroy = PCDestroy_Eisenstat; pc->ops->reset = PCReset_Eisenstat; pc->ops->view = PCView_Eisenstat; pc->ops->setup = PCSetUp_Eisenstat; pc->data = (void*)eis; eis->omega = 1.0; eis->b[0] = 0; eis->b[1] = 0; eis->diag = 0; eis->usediag = PETSC_TRUE; ierr = PetscObjectComposeFunction((PetscObject)pc,"PCEisenstatSetOmega_C",PCEisenstatSetOmega_Eisenstat);CHKERRQ(ierr); ierr = PetscObjectComposeFunction((PetscObject)pc,"PCEisenstatSetNoDiagonalScaling_C",PCEisenstatSetNoDiagonalScaling_Eisenstat);CHKERRQ(ierr); ierr = PetscObjectComposeFunction((PetscObject)pc,"PCEisenstatGetOmega_C",PCEisenstatGetOmega_Eisenstat);CHKERRQ(ierr); ierr = PetscObjectComposeFunction((PetscObject)pc,"PCEisenstatGetNoDiagonalScaling_C",PCEisenstatGetNoDiagonalScaling_Eisenstat);CHKERRQ(ierr); PetscFunctionReturn(0); }