Actual source code: tfs.c

  1: /*
  2:         Provides an interface to the Tufo-Fischer parallel direct solver
  3: */

  5: #include <petsc/private/pcimpl.h>
  6: #include <../src/mat/impls/aij/mpi/mpiaij.h>
  7: #include <../src/ksp/pc/impls/tfs/tfs.h>

  9: typedef struct {
 10:   xxt_ADT  xxt;
 11:   xyt_ADT  xyt;
 12:   Vec      b, xd, xo;
 13:   PetscInt nd;
 14: } PC_TFS;

 16: static PetscErrorCode PCDestroy_TFS(PC pc)
 17: {
 18:   PC_TFS *tfs = (PC_TFS *)pc->data;

 20:   PetscFunctionBegin;
 21:   /* free the XXT datastructures */
 22:   if (tfs->xxt) PetscCall(XXT_free(tfs->xxt));
 23:   if (tfs->xyt) PetscCall(XYT_free(tfs->xyt));
 24:   PetscCall(VecDestroy(&tfs->b));
 25:   PetscCall(VecDestroy(&tfs->xd));
 26:   PetscCall(VecDestroy(&tfs->xo));
 27:   PetscCall(PetscFree(pc->data));
 28:   PetscFunctionReturn(PETSC_SUCCESS);
 29: }

 31: static PetscErrorCode PCApply_TFS_XXT(PC pc, Vec x, Vec y)
 32: {
 33:   PC_TFS            *tfs = (PC_TFS *)pc->data;
 34:   PetscScalar       *yy;
 35:   const PetscScalar *xx;

 37:   PetscFunctionBegin;
 38:   PetscCall(VecGetArrayRead(x, &xx));
 39:   PetscCall(VecGetArray(y, &yy));
 40:   PetscCall(XXT_solve(tfs->xxt, yy, (PetscScalar *)xx));
 41:   PetscCall(VecRestoreArrayRead(x, &xx));
 42:   PetscCall(VecRestoreArray(y, &yy));
 43:   PetscFunctionReturn(PETSC_SUCCESS);
 44: }

 46: static PetscErrorCode PCApply_TFS_XYT(PC pc, Vec x, Vec y)
 47: {
 48:   PC_TFS            *tfs = (PC_TFS *)pc->data;
 49:   PetscScalar       *yy;
 50:   const PetscScalar *xx;

 52:   PetscFunctionBegin;
 53:   PetscCall(VecGetArrayRead(x, &xx));
 54:   PetscCall(VecGetArray(y, &yy));
 55:   PetscCall(XYT_solve(tfs->xyt, yy, (PetscScalar *)xx));
 56:   PetscCall(VecRestoreArrayRead(x, &xx));
 57:   PetscCall(VecRestoreArray(y, &yy));
 58:   PetscFunctionReturn(PETSC_SUCCESS);
 59: }

 61: static PetscErrorCode PCTFSLocalMult_TFS(PC pc, PetscScalar *xin, PetscScalar *xout)
 62: {
 63:   PC_TFS     *tfs = (PC_TFS *)pc->data;
 64:   Mat         A   = pc->pmat;
 65:   Mat_MPIAIJ *a   = (Mat_MPIAIJ *)A->data;

 67:   PetscFunctionBegin;
 68:   PetscCall(VecPlaceArray(tfs->b, xout));
 69:   PetscCall(VecPlaceArray(tfs->xd, xin));
 70:   PetscCall(VecPlaceArray(tfs->xo, xin + tfs->nd));
 71:   PetscCall(MatMult(a->A, tfs->xd, tfs->b));
 72:   PetscCall(MatMultAdd(a->B, tfs->xo, tfs->b, tfs->b));
 73:   PetscCall(VecResetArray(tfs->b));
 74:   PetscCall(VecResetArray(tfs->xd));
 75:   PetscCall(VecResetArray(tfs->xo));
 76:   PetscFunctionReturn(PETSC_SUCCESS);
 77: }

 79: static PetscErrorCode PCSetUp_TFS(PC pc)
 80: {
 81:   PC_TFS     *tfs = (PC_TFS *)pc->data;
 82:   Mat         A   = pc->pmat;
 83:   Mat_MPIAIJ *a   = (Mat_MPIAIJ *)A->data;
 84:   PetscInt   *localtoglobal, ncol, i;
 85:   PetscBool   ismpiaij;

 87:   /*
 88:   PetscBool      issymmetric;
 89:   Petsc Real tol = 0.0;
 90:   */

 92:   PetscFunctionBegin;
 93:   PetscCheck(A->cmap->N == A->rmap->N, PetscObjectComm((PetscObject)pc), PETSC_ERR_ARG_SIZ, "matrix must be square");
 94:   PetscCall(PetscObjectTypeCompare((PetscObject)pc->pmat, MATMPIAIJ, &ismpiaij));
 95:   PetscCheck(ismpiaij, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Currently only supports MPIAIJ matrices");

 97:   /* generate the local to global mapping */
 98:   ncol = a->A->cmap->n + a->B->cmap->n;
 99:   PetscCall(PetscMalloc1(ncol, &localtoglobal));
100:   for (i = 0; i < a->A->cmap->n; i++) localtoglobal[i] = A->cmap->rstart + i + 1;
101:   for (i = 0; i < a->B->cmap->n; i++) localtoglobal[i + a->A->cmap->n] = a->garray[i] + 1;

103:   /* generate the vectors needed for the local solves */
104:   PetscCall(VecCreateSeqWithArray(PETSC_COMM_SELF, 1, a->A->rmap->n, NULL, &tfs->b));
105:   PetscCall(VecCreateSeqWithArray(PETSC_COMM_SELF, 1, a->A->cmap->n, NULL, &tfs->xd));
106:   PetscCall(VecCreateSeqWithArray(PETSC_COMM_SELF, 1, a->B->cmap->n, NULL, &tfs->xo));
107:   tfs->nd = a->A->cmap->n;

109:   /*  ierr =  MatIsSymmetric(A,tol,&issymmetric); */
110:   /*  if (issymmetric) { */
111:   PetscCall(PetscBarrier((PetscObject)pc));
112:   if (A->symmetric == PETSC_BOOL3_TRUE) {
113:     tfs->xxt = XXT_new();
114:     PetscCall(XXT_factor(tfs->xxt, localtoglobal, A->rmap->n, ncol, (PetscErrorCode (*)(void *, PetscScalar *, PetscScalar *))PCTFSLocalMult_TFS, pc));
115:     pc->ops->apply = PCApply_TFS_XXT;
116:   } else {
117:     tfs->xyt = XYT_new();
118:     PetscCall(XYT_factor(tfs->xyt, localtoglobal, A->rmap->n, ncol, (PetscErrorCode (*)(void *, PetscScalar *, PetscScalar *))PCTFSLocalMult_TFS, pc));
119:     pc->ops->apply = PCApply_TFS_XYT;
120:   }

122:   PetscCall(PetscFree(localtoglobal));
123:   PetscFunctionReturn(PETSC_SUCCESS);
124: }

126: static PetscErrorCode PCSetFromOptions_TFS(PC pc, PetscOptionItems *PetscOptionsObject)
127: {
128:   PetscFunctionBegin;
129:   PetscFunctionReturn(PETSC_SUCCESS);
130: }
131: static PetscErrorCode PCView_TFS(PC pc, PetscViewer viewer)
132: {
133:   PetscFunctionBegin;
134:   PetscFunctionReturn(PETSC_SUCCESS);
135: }

137: /*MC
138:      PCTFS - A parallel direct solver intended for problems with very few unknowns (like the
139:          coarse grid in multigrid). Performs a Cholesky or LU factorization of a matrix defined by
140:          its local matrix-vector product.

142:    Level: beginner

144:    Notes:
145:     Only implemented for the `MATMPIAIJ` matrices

147:     Only works on a solver object that lives on all of `PETSC_COMM_WORLD`!

149:     Only works for real numbers (is not built if `PetscScalar` is complex)

151:    Implemented by  Henry M. Tufo III and Paul Fischer originally for Nek5000 and called XXT or XYT

153: .seealso: [](ch_ksp), `PCCreate()`, `PCSetType()`, `PCType`, `PC`
154: M*/
155: PETSC_EXTERN PetscErrorCode PCCreate_TFS(PC pc)
156: {
157:   PC_TFS     *tfs;
158:   PetscMPIInt cmp;

160:   PetscFunctionBegin;
161:   PetscCallMPI(MPI_Comm_compare(PETSC_COMM_WORLD, PetscObjectComm((PetscObject)pc), &cmp));
162:   PetscCheck(cmp == MPI_IDENT || cmp == MPI_CONGRUENT, PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "TFS only works with PETSC_COMM_WORLD objects");
163:   PetscCall(PetscNew(&tfs));

165:   tfs->xxt = NULL;
166:   tfs->xyt = NULL;
167:   tfs->b   = NULL;
168:   tfs->xd  = NULL;
169:   tfs->xo  = NULL;
170:   tfs->nd  = 0;

172:   pc->ops->apply               = NULL;
173:   pc->ops->applytranspose      = NULL;
174:   pc->ops->setup               = PCSetUp_TFS;
175:   pc->ops->destroy             = PCDestroy_TFS;
176:   pc->ops->setfromoptions      = PCSetFromOptions_TFS;
177:   pc->ops->view                = PCView_TFS;
178:   pc->ops->applyrichardson     = NULL;
179:   pc->ops->applysymmetricleft  = NULL;
180:   pc->ops->applysymmetricright = NULL;
181:   pc->data                     = (void *)tfs;
182:   PetscFunctionReturn(PETSC_SUCCESS);
183: }