Actual source code: stag2d.c
petsc-3.13.6 2020-09-29
1: /* Functions specific to the 2-dimensional implementation of DMStag */
2: #include <petsc/private/dmstagimpl.h>
4: /*@C
5: DMStagCreate2d - Create an object to manage data living on the faces, edges, and vertices of a parallelized regular 2D grid.
7: Collective
9: Input Parameters:
10: + comm - MPI communicator
11: . bndx,bndy - boundary type: DM_BOUNDARY_NONE, DM_BOUNDARY_PERIODIC, or DM_BOUNDARY_GHOSTED
12: . M,N - global number of grid points in x,y directions
13: . m,n - number of ranks in the x,y directions (may be PETSC_DECIDE)
14: . dof0 - number of degrees of freedom per vertex/point/node/0-cell
15: . dof1 - number of degrees of freedom per edge/1-cell
16: . dof2 - number of degrees of freedom per element/2-cell
17: . stencilType - ghost/halo region type: DMSTAG_STENCIL_NONE, DMSTAG_STENCIL_BOX, or DMSTAG_STENCIL_STAR
18: . stencilWidth - width, in elements, of halo/ghost region
19: - lx,ly - arrays of local x,y element counts, of length equal to m,n, summing to M,N
21: Output Parameter:
22: . dm - the new DMStag object
24: Options Database Keys:
25: + -dm_view - calls DMViewFromOptions() a the conclusion of DMSetUp()
26: . -stag_grid_x <nx> - number of elements in the x direction
27: . -stag_grid_y <ny> - number of elements in the y direction
28: . -stag_ranks_x <rx> - number of ranks in the x direction
29: . -stag_ranks_y <ry> - number of ranks in the y direction
30: . -stag_ghost_stencil_width - width of ghost region, in elements
31: . -stag_boundary_type_x <none,ghosted,periodic> - DMBoundaryType value
32: - -stag_boundary_type_y <none,ghosted,periodic> - DMBoundaryType value
34: Notes:
35: You must call DMSetUp() after this call, before using the DM.
36: If you wish to use the options database (see the keys above) to change values in the DMStag, you must call
37: DMSetFromOptions() after this function but before DMSetUp().
39: Level: beginner
41: .seealso: DMSTAG, DMStagCreate1d(), DMStagCreate3d(), DMDestroy(), DMView(), DMCreateGlobalVector(), DMCreateLocalVector(), DMLocalToGlobalBegin(), DMDACreate2d()
42: @*/
43: PETSC_EXTERN PetscErrorCode DMStagCreate2d(MPI_Comm comm, DMBoundaryType bndx,DMBoundaryType bndy, PetscInt M,PetscInt N, PetscInt m,PetscInt n, PetscInt dof0, PetscInt dof1, PetscInt dof2, DMStagStencilType stencilType, PetscInt stencilWidth, const PetscInt lx[], const PetscInt ly[],DM* dm)
44: {
48: DMCreate(comm,dm);
49: DMSetDimension(*dm,2);
50: DMStagInitialize(bndx,bndy,DM_BOUNDARY_NONE,M,N,0,m,n,0,dof0,dof1,dof2,0,stencilType,stencilWidth,lx,ly,NULL,*dm);
51: return(0);
52: }
54: PETSC_INTERN PetscErrorCode DMStagSetUniformCoordinatesExplicit_2d(DM dm,PetscReal xmin,PetscReal xmax,PetscReal ymin,PetscReal ymax)
55: {
57: DM_Stag *stagCoord;
58: DM dmCoord;
59: Vec coordLocal,coord;
60: PetscReal h[2],min[2];
61: PetscScalar ***arr;
62: PetscInt ind[2],start[2],n[2],nExtra[2],s,c;
63: PetscInt idownleft,idown,ileft,ielement;
66: DMGetCoordinateDM(dm, &dmCoord);
67: stagCoord = (DM_Stag*) dmCoord->data;
68: for (s=0; s<3; ++s) {
69: if (stagCoord->dof[s] !=0 && stagCoord->dof[s] != 2) SETERRQ2(PetscObjectComm((PetscObject)dm),PETSC_ERR_PLIB,"Coordinate DM in 2 dimensions must have 0 or 2 dof on each stratum, but stratum %d has %d dof",s,stagCoord->dof[s]);
70: }
71: DMGetLocalVector(dmCoord,&coordLocal);
73: DMStagVecGetArray(dmCoord,coordLocal,&arr);
74: if (stagCoord->dof[0]) {
75: DMStagGetLocationSlot(dmCoord,DMSTAG_DOWN_LEFT,0,&idownleft);
76: }
77: if (stagCoord->dof[1]) {
78: DMStagGetLocationSlot(dmCoord,DMSTAG_DOWN ,0,&idown );
79: DMStagGetLocationSlot(dmCoord,DMSTAG_LEFT ,0,&ileft );
80: }
81: if (stagCoord->dof[2]) {
82: DMStagGetLocationSlot(dmCoord,DMSTAG_ELEMENT ,0,&ielement );
83: }
84: DMStagGetCorners(dmCoord,&start[0],&start[1],NULL,&n[0],&n[1],NULL,&nExtra[0],&nExtra[1],NULL);
86: min[0] = xmin; min[1]= ymin;
87: h[0] = (xmax-xmin)/stagCoord->N[0];
88: h[1] = (ymax-ymin)/stagCoord->N[1];
90: for(ind[1]=start[1]; ind[1]<start[1] + n[1] + nExtra[1]; ++ind[1]) {
91: for(ind[0]=start[0]; ind[0]<start[0] + n[0] + nExtra[0]; ++ind[0]) {
92: if (stagCoord->dof[0]) {
93: const PetscReal offs[2] = {0.0,0.0};
94: for (c=0; c<2; ++c) {
95: arr[ind[1]][ind[0]][idownleft + c] = min[c] + ((PetscReal)ind[c] + offs[c]) * h[c];
96: }
97: }
98: if (stagCoord->dof[1]) {
99: const PetscReal offs[2] = {0.5,0.0};
100: for (c=0; c<2; ++c) {
101: arr[ind[1]][ind[0]][idown + c] = min[c] + ((PetscReal)ind[c] + offs[c]) * h[c];
102: }
103: }
104: if (stagCoord->dof[1]) {
105: const PetscReal offs[2] = {0.0,0.5};
106: for (c=0; c<2; ++c) {
107: arr[ind[1]][ind[0]][ileft + c] = min[c] + ((PetscReal)ind[c] + offs[c]) * h[c];
108: }
109: }
110: if (stagCoord->dof[2]) {
111: const PetscReal offs[2] = {0.5,0.5};
112: for (c=0; c<2; ++c) {
113: arr[ind[1]][ind[0]][ielement + c] = min[c] + ((PetscReal)ind[c] + offs[c]) * h[c];
114: }
115: }
116: }
117: }
118: DMStagVecRestoreArray(dmCoord,coordLocal,&arr);
119: DMCreateGlobalVector(dmCoord,&coord);
120: DMLocalToGlobalBegin(dmCoord,coordLocal,INSERT_VALUES,coord);
121: DMLocalToGlobalEnd(dmCoord,coordLocal,INSERT_VALUES,coord);
122: DMSetCoordinates(dm,coord);
123: PetscLogObjectParent((PetscObject)dm,(PetscObject)coord);
124: DMRestoreLocalVector(dmCoord,&coordLocal);
125: VecDestroy(&coord);
126: return(0);
127: }
129: /* Helper functions used in DMSetUp_Stag() */
130: static PetscErrorCode DMStagSetUpBuildRankGrid_2d(DM);
131: static PetscErrorCode DMStagSetUpBuildNeighbors_2d(DM);
132: static PetscErrorCode DMStagSetUpBuildGlobalOffsets_2d(DM,PetscInt**);
133: static PetscErrorCode DMStagComputeLocationOffsets_2d(DM);
135: PETSC_INTERN PetscErrorCode DMSetUp_Stag_2d(DM dm)
136: {
137: PetscErrorCode ierr;
138: DM_Stag * const stag = (DM_Stag*)dm->data;
139: PetscMPIInt size,rank;
140: PetscInt i,j,d,entriesPerElementRowGhost,entriesPerCorner,entriesPerEdge,entriesPerElementRow;
141: MPI_Comm comm;
142: PetscInt *globalOffsets;
143: PetscBool star,dummyStart[2],dummyEnd[2];
144: const PetscInt dim = 2;
147: PetscObjectGetComm((PetscObject)dm,&comm);
148: MPI_Comm_size(comm,&size);
149: MPI_Comm_rank(comm,&rank);
151: /* Rank grid sizes (populates stag->nRanks) */
152: DMStagSetUpBuildRankGrid_2d(dm);
154: /* Determine location of rank in grid (these get extra boundary points on the last element)
155: Order is x-fast, as usual */
156: stag->rank[0] = rank % stag->nRanks[0];
157: stag->rank[1] = rank / stag->nRanks[0];
158: for(i=0; i<dim; ++i) {
159: stag->firstRank[i] = PetscNot(stag->rank[i]);
160: stag->lastRank[i] = (PetscBool)(stag->rank[i] == stag->nRanks[i]-1);
161: }
163: /* Determine Locally owned region
165: Divide equally, giving lower ranks in each dimension and extra element if needbe.
167: Note that this uses O(P) storage. If this ever becomes an issue, this could
168: be refactored to not keep this data around. */
169: for (i=0; i<dim; ++i) {
170: if (!stag->l[i]) {
171: const PetscInt Ni = stag->N[i], nRanksi = stag->nRanks[i];
172: PetscMalloc1(stag->nRanks[i],&stag->l[i]);
173: for (j=0; j<stag->nRanks[i]; ++j){
174: stag->l[i][j] = Ni/nRanksi + ((Ni % nRanksi) > j);
175: }
176: }
177: }
179: /* Retrieve local size in stag->n */
180: for (i=0; i<dim; ++i) stag->n[i] = stag->l[i][stag->rank[i]];
181: #if defined(PETSC_USE_DEBUG)
182: for (i=0; i<dim; ++i) {
183: PetscInt Ncheck,j;
184: Ncheck = 0;
185: for (j=0; j<stag->nRanks[i]; ++j) Ncheck += stag->l[i][j];
186: if (Ncheck != stag->N[i]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local sizes in dimension %d don't add up. %d != %d\n",i,Ncheck,stag->N[i]);
187: }
188: #endif
190: /* Compute starting elements */
191: for (i=0; i<dim; ++i) {
192: stag->start[i] = 0;
193: for(j=0;j<stag->rank[i];++j){
194: stag->start[i] += stag->l[i][j];
195: }
196: }
198: /* Determine ranks of neighbors, using DMDA's convention
200: n6 n7 n8
201: n3 n5
202: n0 n1 n2 */
203: DMStagSetUpBuildNeighbors_2d(dm);
205: /* Determine whether the ghost region includes dummies or not. This is currently
206: equivalent to having a non-periodic boundary. If not, then
207: ghostOffset{Start,End}[d] elements correspond to elements on the neighbor.
208: If true, then
209: - at the start, there are ghostOffsetStart[d] ghost elements
210: - at the end, there is a layer of extra "physical" points inside a layer of
211: ghostOffsetEnd[d] ghost elements
212: Note that this computation should be updated if any boundary types besides
213: NONE, GHOSTED, and PERIODIC are supported. */
214: for (d=0; d<2; ++d) dummyStart[d] = (PetscBool)(stag->firstRank[d] && stag->boundaryType[d] != DM_BOUNDARY_PERIODIC);
215: for (d=0; d<2; ++d) dummyEnd[d] = (PetscBool)(stag->lastRank[d] && stag->boundaryType[d] != DM_BOUNDARY_PERIODIC);
217: /* Define useful sizes */
218: stag->entriesPerElement = stag->dof[0] + 2*stag->dof[1] + stag->dof[2];
219: entriesPerEdge = stag->dof[0] + stag->dof[1];
220: entriesPerCorner = stag->dof[0];
221: entriesPerElementRow = stag->n[0]*stag->entriesPerElement + (dummyEnd[0] ? entriesPerEdge : 0);
222: stag->entries = stag->n[1]*entriesPerElementRow + (dummyEnd[1] ? stag->n[0]*entriesPerEdge : 0 ) + (dummyEnd[0] && dummyEnd[1] ? entriesPerCorner: 0);
224: /* Compute offsets for each rank into global vectors
225: This again requires O(P) storage, which could be replaced with some global
226: communication. */
227: DMStagSetUpBuildGlobalOffsets_2d(dm,&globalOffsets);
229: for (d=0; d<dim; ++d) if (stag->boundaryType[d] != DM_BOUNDARY_NONE && stag->boundaryType[d] != DM_BOUNDARY_PERIODIC && stag->boundaryType[d] != DM_BOUNDARY_GHOSTED) SETERRQ(PETSC_COMM_WORLD,PETSC_ERR_SUP,"Unsupported boundary type");
231: /* Define ghosted/local sizes */
232: for (d=0; d<dim; ++d) {
233: switch (stag->boundaryType[d]) {
234: case DM_BOUNDARY_NONE:
235: /* Note: for a elements-only DMStag, the extra elements on the edges aren't necessary but we include them anyway */
236: switch (stag->stencilType) {
237: case DMSTAG_STENCIL_NONE : /* only the extra one on the right/top edges */
238: stag->nGhost[d] = stag->n[d];
239: stag->startGhost[d] = stag->start[d];
240: if (stag->lastRank[d]) stag->nGhost[d] += 1;
241: break;
242: case DMSTAG_STENCIL_STAR : /* allocate the corners but don't use them */
243: case DMSTAG_STENCIL_BOX :
244: stag->nGhost[d] = stag->n[d];
245: stag->startGhost[d] = stag->start[d];
246: if (!stag->firstRank[d]) {
247: stag->nGhost[d] += stag->stencilWidth; /* add interior ghost elements */
248: stag->startGhost[d] -= stag->stencilWidth;
249: }
250: if (!stag->lastRank[d]) {
251: stag->nGhost[d] += stag->stencilWidth; /* add interior ghost elements */
252: } else {
253: stag->nGhost[d] += 1; /* one element on the boundary to complete blocking */
254: }
255: break;
256: default :
257: SETERRQ1(PETSC_COMM_WORLD,PETSC_ERR_SUP,"Unrecognized ghost stencil type %d",stag->stencilType);
258: }
259: break;
260: case DM_BOUNDARY_GHOSTED:
261: switch (stag->stencilType) {
262: case DMSTAG_STENCIL_NONE :
263: stag->startGhost[d] = stag->start[d];
264: stag->nGhost[d] = stag->n[d] + (stag->lastRank[d] ? 1 : 0);
265: break;
266: case DMSTAG_STENCIL_STAR :
267: case DMSTAG_STENCIL_BOX :
268: stag->startGhost[d] = stag->start[d] - stag->stencilWidth; /* This value may be negative */
269: stag->nGhost[d] = stag->n[d] + 2*stag->stencilWidth + (stag->lastRank[d] && stag->stencilWidth == 0 ? 1 : 0);
270: break;
271: default :
272: SETERRQ1(PETSC_COMM_WORLD,PETSC_ERR_SUP,"Unrecognized ghost stencil type %d",stag->stencilType);
273: }
274: break;
275: case DM_BOUNDARY_PERIODIC:
276: switch (stag->stencilType) {
277: case DMSTAG_STENCIL_NONE : /* only the extra one on the right/top edges */
278: stag->nGhost[d] = stag->n[d];
279: stag->startGhost[d] = stag->start[d];
280: break;
281: case DMSTAG_STENCIL_STAR :
282: case DMSTAG_STENCIL_BOX :
283: stag->nGhost[d] = stag->n[d] + 2*stag->stencilWidth;
284: stag->startGhost[d] = stag->start[d] - stag->stencilWidth;
285: break;
286: default :
287: SETERRQ1(PETSC_COMM_WORLD,PETSC_ERR_SUP,"Unrecognized ghost stencil type %d",stag->stencilType);
288: }
289: break;
290: default: SETERRQ1(PETSC_COMM_WORLD,PETSC_ERR_SUP,"Unsupported boundary type in dimension %D",d);
291: }
292: }
293: stag->entriesGhost = stag->nGhost[0]*stag->nGhost[1]*stag->entriesPerElement;
294: entriesPerElementRowGhost = stag->nGhost[0]*stag->entriesPerElement;
296: /* Create global-->local VecScatter and local->global ISLocalToGlobalMapping
298: We iterate over all local points twice. First, we iterate over each neighbor, populating
299: 1. idxLocal[] : the subset of points, in local numbering ("S" from 0 on all points including ghosts), which correspond to global points. That is, the set of all non-dummy points in the ghosted representation
300: 2. idxGlobal[]: the corresponding global points, in global numbering (Nested "S"s - ranks then non-ghost points in each rank)
302: Next, we iterate over all points in the local ordering, populating
303: 3. idxGlobalAll[] : entry i is the global point corresponding to local point i, or -1 if local point i is a dummy.
305: Note further here that the local/ghosted vectors:
306: - Are always an integral number of elements-worth of points, in all directions.
307: - Contain three flavors of points:
308: 1. Points which "live here" in the global representation
309: 2. Ghost points which correspond to points on other ranks in the global representation
310: 3. Ghost points, which we call "dummy points," which do not correspond to any point in the global representation
312: Dummy ghost points arise in at least three ways:
313: 1. As padding for the right, top, and front physical boundaries, to complete partial elements
314: 2. As unused space in the "corners" on interior ranks when using a star stencil
315: 3. As additional work space on all physical boundaries, when DM_BOUNDARY_GHOSTED is used
317: Note that, because of the boundary dummies,
318: with a stencil width of zero, on 1 rank, local and global vectors
319: are still different!
321: We assume that the size on each rank is greater than or equal to the
322: stencil width.
323: */
325: if (stag->n[0] < stag->stencilWidth || stag->n[1] < stag->stencilWidth) {
326: SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_SUP,"DMStag 2d setup does not support local sizes (%D x %D) smaller than the elementwise stencil width (%D)",stag->n[0],stag->n[1],stag->stencilWidth);
327: }
329: /* Check stencil type */
330: if (stag->stencilType != DMSTAG_STENCIL_NONE && stag->stencilType != DMSTAG_STENCIL_BOX && stag->stencilType != DMSTAG_STENCIL_STAR) SETERRQ1(PetscObjectComm((PetscObject)dm),PETSC_ERR_SUP,"Unsupported stencil type %s",DMStagStencilTypes[stag->stencilType]);
331: if (stag->stencilType == DMSTAG_STENCIL_NONE && stag->stencilWidth != 0) SETERRQ(PetscObjectComm((PetscObject)dm),PETSC_ERR_SUP,"DMStag 2d setup requries stencil width 0 with stencil type none");
332: star = (PetscBool)(stag->stencilType == DMSTAG_STENCIL_STAR);
334: {
335: PetscInt *idxLocal,*idxGlobal,*idxGlobalAll;
336: PetscInt count,countAll,entriesToTransferTotal,i,j,d,ghostOffsetStart[2],ghostOffsetEnd[2];
337: IS isLocal,isGlobal;
338: PetscInt jghost,ighost;
339: PetscInt nNeighbors[9][2];
340: PetscBool nextToDummyEnd[2];
342: /* Compute numbers of elements on each neighbor */
343: for (i=0; i<9; ++i) {
344: const PetscInt neighborRank = stag->neighbors[i];
345: if (neighborRank >= 0) { /* note we copy the values for our own rank (neighbor 4) */
346: nNeighbors[i][0] = stag->l[0][neighborRank % stag->nRanks[0]];
347: nNeighbors[i][1] = stag->l[1][neighborRank / stag->nRanks[0]];
348: } /* else leave uninitialized - error if accessed */
349: }
351: /* These offsets should always be non-negative, and describe how many
352: ghost elements exist at each boundary. These are not always equal to the stencil width,
353: because we may have different numbers of ghost elements at the boundaries. In particular,
354: we always have at least one ghost (dummy) element at the right/top/front. */
355: for (d=0; d<2; ++d) ghostOffsetStart[d] = stag->start[d] - stag->startGhost[d];
356: for (d=0; d<2; ++d) ghostOffsetEnd[d] = stag->startGhost[d]+stag->nGhost[d] - (stag->start[d]+stag->n[d]);
358: /* Compute whether the next rank has an extra point (only used in x direction) */
359: for (d=0;d<2;++d) nextToDummyEnd[d] = (PetscBool)(stag->boundaryType[d] != DM_BOUNDARY_PERIODIC && stag->rank[d] == stag->nRanks[d]-2);
361: /* Compute the number of local entries which correspond to any global entry */
362: {
363: PetscInt nNonDummyGhost[2];
364: for (d=0; d<2; ++d) nNonDummyGhost[d] = stag->nGhost[d] - (dummyStart[d] ? ghostOffsetStart[d] : 0) - (dummyEnd[d] ? ghostOffsetEnd[d] : 0);
365: if (star) {
366: entriesToTransferTotal = (nNonDummyGhost[0] * stag->n[1] + stag->n[0] * nNonDummyGhost[1] - stag->n[0] * stag->n[1]) * stag->entriesPerElement
367: + (dummyEnd[0] ? nNonDummyGhost[1] * entriesPerEdge : 0)
368: + (dummyEnd[1] ? nNonDummyGhost[0] * entriesPerEdge : 0)
369: + (dummyEnd[0] && dummyEnd[1] ? entriesPerCorner : 0);
370: } else {
371: entriesToTransferTotal = nNonDummyGhost[0] * nNonDummyGhost[1] * stag->entriesPerElement
372: + (dummyEnd[0] ? nNonDummyGhost[1] * entriesPerEdge : 0)
373: + (dummyEnd[1] ? nNonDummyGhost[0] * entriesPerEdge : 0)
374: + (dummyEnd[0] && dummyEnd[1] ? entriesPerCorner : 0);
375: }
376: }
378: /* Allocate arrays to populate */
379: PetscMalloc1(entriesToTransferTotal,&idxLocal);
380: PetscMalloc1(entriesToTransferTotal,&idxGlobal);
382: /* Counts into idxLocal/idxGlobal */
383: count = 0;
385: /* Here and below, we work with (i,j) describing element numbers within a neighboring rank's global ordering,
386: to be offset by that rank's global offset,
387: and (ighost,jghost) referring to element numbers within this ranks local (ghosted) ordering */
389: /* Neighbor 0 (down left) */
390: if (!star && !dummyStart[0] && !dummyStart[1]) {
391: const PetscInt neighbor = 0;
392: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
393: const PetscInt * const nNeighbor = nNeighbors[neighbor];
394: const PetscInt entriesPerElementRowNeighbor = stag->entriesPerElement * nNeighbor[0];
395: for (jghost = 0; jghost<ghostOffsetStart[1]; ++jghost) {
396: const PetscInt j = nNeighbor[1] - ghostOffsetStart[1] + jghost;
397: for (ighost = 0; ighost<ghostOffsetStart[0]; ++ighost) {
398: const PetscInt i = nNeighbor[0] - ghostOffsetStart[0] + ighost;
399: for (d=0; d<stag->entriesPerElement; ++d,++count) {
400: idxGlobal[count] = globalOffset + j *entriesPerElementRowNeighbor + i *stag->entriesPerElement + d;
401: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
402: }
403: }
404: }
405: }
407: /* Neighbor 1 (down) */
408: if (!dummyStart[1]) {
409: /* We may be a ghosted boundary in x, in which case the neighbor is also */
410: const PetscInt neighbor = 1;
411: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
412: const PetscInt * const nNeighbor = nNeighbors[neighbor];
413: const PetscInt entriesPerElementRowNeighbor = entriesPerElementRow; /* same as here */
414: for (jghost = 0; jghost<ghostOffsetStart[1]; ++jghost) {
415: const PetscInt j = nNeighbor[1] - ghostOffsetStart[1] + jghost;
416: for (ighost = ghostOffsetStart[0]; ighost<stag->nGhost[0]-ghostOffsetEnd[0]; ++ighost) {
417: const PetscInt i = ighost - ghostOffsetStart[0];
418: for (d=0; d<stag->entriesPerElement; ++d, ++count) {
419: idxGlobal[count] = globalOffset+ j *entriesPerElementRowNeighbor + i *stag->entriesPerElement + d;
420: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
421: }
422: }
423: if (dummyEnd[0]) {
424: const PetscInt ighost = stag->nGhost[0]-ghostOffsetEnd[0];
425: const PetscInt i = stag->n[0];
426: for (d=0; d<stag->dof[0]; ++d, ++count) { /* Vertex */
427: idxGlobal[count] = globalOffset + j *entriesPerElementRowNeighbor + i *stag->entriesPerElement + d;
428: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
429: }
430: for (d=0; d<stag->dof[1]; ++d,++count) { /* Edge */
431: idxGlobal[count] = globalOffset + j *entriesPerElementRowNeighbor + i *stag->entriesPerElement + stag->dof[0] + d;
432: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + stag->dof[0] + stag->dof[1] + d;
433: }
434: }
435: }
436: }
438: /* Neighbor 2 (down right) */
439: if (!star && !dummyEnd[0] && !dummyStart[1]) {
440: const PetscInt neighbor = 2;
441: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
442: const PetscInt * const nNeighbor = nNeighbors[neighbor];
443: const PetscInt entriesPerElementRowNeighbor = nNeighbor[0]*stag->entriesPerElement + (nextToDummyEnd[0] ? entriesPerEdge : 0);
444: for (jghost = 0; jghost<ghostOffsetStart[1]; ++jghost) {
445: const PetscInt j = nNeighbor[1] - ghostOffsetStart[1] + jghost;
446: for (i=0; i<ghostOffsetEnd[0]; ++i) {
447: const PetscInt ighost = stag->nGhost[0] - ghostOffsetEnd[0] + i;
448: for (d=0; d<stag->entriesPerElement; ++d, ++count) {
449: idxGlobal[count] = globalOffset + j *entriesPerElementRowNeighbor + i *stag->entriesPerElement + d;
450: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
451: }
452: }
453: }
454: }
456: /* Neighbor 3 (left) */
457: if (!dummyStart[0]) {
458: /* Our neighbor is never a ghosted boundary in x, but we may be
459: Here, we may be a ghosted boundary in y and thus so will our neighbor be */
460: const PetscInt neighbor = 3;
461: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
462: const PetscInt * const nNeighbor = nNeighbors[neighbor];
463: const PetscInt entriesPerElementRowNeighbor = nNeighbor[0]*stag->entriesPerElement;
464: for (jghost = ghostOffsetStart[1]; jghost<stag->nGhost[1] - ghostOffsetEnd[1]; ++jghost) {
465: const PetscInt j = jghost-ghostOffsetStart[1];
466: for (ighost = 0; ighost<ghostOffsetStart[0]; ++ighost) {
467: const PetscInt i = nNeighbor[0] - ghostOffsetStart[0] + ighost;
468: for (d=0; d<stag->entriesPerElement; ++d, ++count) {
469: idxGlobal[count] = globalOffset + j *entriesPerElementRowNeighbor + i *stag->entriesPerElement + d;
470: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
471: }
472: }
473: }
474: if (dummyEnd[1]) {
475: const PetscInt jghost = stag->nGhost[1]-ghostOffsetEnd[1];
476: const PetscInt j = stag->n[1];
477: for (ighost = 0; ighost<ghostOffsetStart[0]; ++ighost) {
478: const PetscInt i = nNeighbor[0] - ghostOffsetStart[0] + ighost;
479: for (d=0; d<entriesPerEdge; ++d, ++count) { /* only vertices and horizontal edge (which are the first dof) */
480: idxGlobal[count] = globalOffset + j *entriesPerElementRowNeighbor + i *entriesPerEdge + d; /* i moves by edge here */
481: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
482: }
483: }
484: }
485: }
487: /* Interior/Resident-here-in-global elements ("Neighbor 4" - same rank)
488: *including* entries from boundary dummy elements */
489: {
490: const PetscInt neighbor = 4;
491: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
492: for (j=0; j<stag->n[1]; ++j) {
493: const PetscInt jghost = j + ghostOffsetStart[1];
494: for (i=0; i<stag->n[0]; ++i) {
495: const PetscInt ighost = i + ghostOffsetStart[0];
496: for (d=0; d<stag->entriesPerElement; ++d, ++count) {
497: idxGlobal[count] = globalOffset + j *entriesPerElementRow + i *stag->entriesPerElement + d;
498: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
499: }
500: }
501: if (dummyEnd[0]) {
502: const PetscInt ighost = i + ghostOffsetStart[0];
503: i = stag->n[0];
504: for (d=0; d<stag->dof[0]; ++d, ++count) { /* vertex first */
505: idxGlobal[count] = globalOffset + j *entriesPerElementRow + i *stag->entriesPerElement + d;
506: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
507: }
508: for (d=0; d<stag->dof[1]; ++d, ++count) { /* then left ege (skipping bottom edge) */
509: idxGlobal[count] = globalOffset + j *entriesPerElementRow + i *stag->entriesPerElement + stag->dof[0] + d;
510: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + stag->dof[0] + stag->dof[1] + d;
511: }
512: }
513: }
514: if (dummyEnd[1]) {
515: const PetscInt jghost = j + ghostOffsetStart[1];
516: j = stag->n[1];
517: for (i=0; i<stag->n[0]; ++i) {
518: const PetscInt ighost = i + ghostOffsetStart[0];
519: for (d=0; d<entriesPerEdge; ++d, ++count) { /* vertex and bottom edge (which are the first entries) */
520: idxGlobal[count] = globalOffset + j *entriesPerElementRow + i*entriesPerEdge + d; /* note i increment by entriesPerEdge */
521: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
522: }
523: }
524: if (dummyEnd[0]) {
525: const PetscInt ighost = i + ghostOffsetStart[0];
526: i = stag->n[0];
527: for (d=0; d<entriesPerCorner; ++d, ++count) { /* vertex only */
528: idxGlobal[count] = globalOffset + j *entriesPerElementRow + i *entriesPerEdge + d; /* note i increment by entriesPerEdge */
529: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
530: }
531: }
532: }
533: }
535: /* Neighbor 5 (right) */
536: if (!dummyEnd[0]) {
537: /* We can never be right boundary, but we may be a top boundary, along with the right neighbor */
538: const PetscInt neighbor = 5;
539: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
540: const PetscInt * const nNeighbor = nNeighbors[neighbor];
541: const PetscInt entriesPerElementRowNeighbor = nNeighbor[0]*stag->entriesPerElement + (nextToDummyEnd[0] ? entriesPerEdge : 0);
542: for (jghost = ghostOffsetStart[1];jghost<stag->nGhost[1]-ghostOffsetEnd[1]; ++jghost) {
543: const PetscInt j = jghost-ghostOffsetStart[1];
544: for (i=0; i<ghostOffsetEnd[0]; ++i) {
545: const PetscInt ighost = stag->nGhost[0] - ghostOffsetEnd[0] + i;
546: for (d=0; d<stag->entriesPerElement; ++d, ++count) {
547: idxGlobal[count] = globalOffset+ j *entriesPerElementRowNeighbor + i *stag->entriesPerElement + d;
548: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
549: }
550: }
551: }
552: if (dummyEnd[1]) {
553: const PetscInt jghost = stag->nGhost[1]-ghostOffsetEnd[1];
554: const PetscInt j = nNeighbor[1];
555: for (i=0; i<ghostOffsetEnd[0]; ++i) {
556: const PetscInt ighost = stag->nGhost[0] - ghostOffsetEnd[0] + i;
557: for (d=0; d<entriesPerEdge; ++d, ++count) { /* only vertices and horizontal edge (which are the first dof) */
558: idxGlobal[count] = globalOffset+ j *entriesPerElementRowNeighbor + i *entriesPerEdge + d; /* Note i increment by entriesPerEdge */
559: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
560: }
561: }
562: }
563: }
565: /* Neighbor 6 (up left) */
566: if (!star && !dummyStart[0] && !dummyEnd[1]) {
567: /* We can never be a top boundary, but our neighbor may be
568: We may be a right boundary, but our neighbor cannot be */
569: const PetscInt neighbor = 6;
570: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
571: const PetscInt * const nNeighbor = nNeighbors[neighbor];
572: const PetscInt entriesPerElementRowNeighbor = nNeighbor[0]*stag->entriesPerElement;
573: for (j=0; j<ghostOffsetEnd[1]; ++j) {
574: const PetscInt jghost = stag->nGhost[1] - ghostOffsetEnd[1] + j;
575: for (ighost = 0; ighost<ghostOffsetStart[0]; ++ighost) {
576: const PetscInt i = nNeighbor[0] - ghostOffsetStart[0] + ighost;
577: for (d=0; d<stag->entriesPerElement; ++d, ++count) {
578: idxGlobal[count] = globalOffset+ j *entriesPerElementRowNeighbor + i *stag->entriesPerElement + d;
579: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
580: }
581: }
582: }
583: }
585: /* Neighbor 7 (up) */
586: if (!dummyEnd[1]) {
587: /* We cannot be the last rank in y, though our neighbor may be
588: We may be the last rank in x, in which case our neighbor is also */
589: const PetscInt neighbor = 7;
590: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
591: const PetscInt * const nNeighbor = nNeighbors[neighbor];
592: const PetscInt entriesPerElementRowNeighbor = entriesPerElementRow; /* same as here */
593: for (j=0; j<ghostOffsetEnd[1]; ++j) {
594: const PetscInt jghost = stag->nGhost[1] - ghostOffsetEnd[1] + j;
595: for (ighost = ghostOffsetStart[0]; ighost<stag->nGhost[0]-ghostOffsetEnd[0]; ++ighost) {
596: const PetscInt i = ighost - ghostOffsetStart[0];
597: for (d=0; d<stag->entriesPerElement; ++d, ++count) {
598: idxGlobal[count] = globalOffset + j *entriesPerElementRowNeighbor + i *stag->entriesPerElement + d;
599: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
600: }
601: }
602: if (dummyEnd[0]) {
603: const PetscInt ighost = stag->nGhost[0]-ghostOffsetEnd[0];
604: const PetscInt i = nNeighbor[0];
605: for (d=0; d<stag->dof[0]; ++d, ++count) { /* Vertex */
606: idxGlobal[count] = globalOffset+ j *entriesPerElementRowNeighbor + i *stag->entriesPerElement + d;
607: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
608: }
609: for (d=0; d<stag->dof[1]; ++d, ++count) { /* Edge */
610: idxGlobal[count] = globalOffset+ j *entriesPerElementRowNeighbor + i *stag->entriesPerElement + stag->dof[0] + d;
611: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + stag->dof[0] + stag->dof[1] + d;
612: }
613: }
614: }
615: }
617: /* Neighbor 8 (up right) */
618: if (!star && !dummyEnd[0] && !dummyEnd[1]) {
619: /* We can never be a ghosted boundary
620: Our neighbor may be a top boundary, a right boundary, or both */
621: const PetscInt neighbor = 8;
622: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
623: const PetscInt * const nNeighbor = nNeighbors[neighbor];
624: const PetscInt entriesPerElementRowNeighbor = nNeighbor[0]*stag->entriesPerElement + (nextToDummyEnd[0] ? entriesPerEdge : 0);
625: for (j=0; j<ghostOffsetEnd[1]; ++j) {
626: const PetscInt jghost = stag->nGhost[1] - ghostOffsetEnd[1] + j;
627: for (i=0; i<ghostOffsetEnd[0]; ++i) {
628: const PetscInt ighost = stag->nGhost[0] - ghostOffsetEnd[0] + i;
629: for (d=0; d<stag->entriesPerElement; ++d, ++count) {
630: idxGlobal[count] = globalOffset + j *entriesPerElementRowNeighbor + i *stag->entriesPerElement + d;
631: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
632: }
633: }
634: }
635: }
637: #if defined(PETSC_USE_DEBUG)
638: if (count != entriesToTransferTotal) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Number of entries computed in gtol (%d) is not as expected (%d)",count,entriesToTransferTotal);
639: #endif
641: /* Create Local and Global ISs (transferring pointer ownership) */
642: ISCreateGeneral(PetscObjectComm((PetscObject)dm),entriesToTransferTotal,idxLocal,PETSC_OWN_POINTER,&isLocal);
643: ISCreateGeneral(PetscObjectComm((PetscObject)dm),entriesToTransferTotal,idxGlobal,PETSC_OWN_POINTER,&isGlobal);
645: /* Create stag->gtol. The order is computed as PETSc ordering, and doesn't include dummy entries */
646: {
647: Vec local,global;
648: VecCreateMPIWithArray(PetscObjectComm((PetscObject)dm),1,stag->entries,PETSC_DECIDE,NULL,&global);
649: VecCreateSeqWithArray(PETSC_COMM_SELF,stag->entriesPerElement,stag->entriesGhost,NULL,&local);
650: VecScatterCreate(global,isGlobal,local,isLocal,&stag->gtol);
651: VecDestroy(&global);
652: VecDestroy(&local);
653: }
655: /* Destroy ISs */
656: ISDestroy(&isLocal);
657: ISDestroy(&isGlobal);
659: /* Next, we iterate over the local entries again, in local order, recording the global entry to which each maps,
660: or -1 if there is none */
661: PetscMalloc1(stag->entriesGhost,&idxGlobalAll);
663: countAll = 0;
665: /* Loop over rows 1/3 : down */
666: if (!dummyStart[1]) {
667: for (jghost=0; jghost<ghostOffsetStart[1]; ++jghost) {
669: /* Loop over columns 1/3 : down left */
670: if (!star && !dummyStart[0]) {
671: const PetscInt neighbor = 0;
672: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
673: const PetscInt * const nNeighbor = nNeighbors[neighbor];
674: const PetscInt j = nNeighbor[1] - ghostOffsetStart[1] + jghost; /* Note: this is actually the same value for the whole row of ranks below, so recomputing it for the next two ranks is redundant, and one could even get rid of jghost entirely if desired */
675: const PetscInt eprNeighbor = nNeighbor[0] * stag->entriesPerElement;
676: for (i=nNeighbor[0]-ghostOffsetStart[0]; i<nNeighbor[0]; ++i) {
677: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
678: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + d;
679: }
680: }
681: } else {
682: /* Down Left dummies */
683: for (ighost=0; ighost<ghostOffsetStart[0]; ++ighost) {
684: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
685: idxGlobalAll[countAll] = -1;
686: }
687: }
688: }
690: /* Loop over columns 2/3 : down middle */
691: {
692: const PetscInt neighbor = 1;
693: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
694: const PetscInt * const nNeighbor = nNeighbors[neighbor];
695: const PetscInt j = nNeighbor[1] - ghostOffsetStart[1] + jghost;
696: const PetscInt eprNeighbor = entriesPerElementRow; /* same as here */
697: for (i=0; i<nNeighbor[0]; ++i) {
698: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
699: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + d;
700: }
701: }
702: }
704: /* Loop over columns 3/3 : down right */
705: if (!star && !dummyEnd[0]) {
706: const PetscInt neighbor = 2;
707: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
708: const PetscInt * const nNeighbor = nNeighbors[neighbor];
709: const PetscInt j = nNeighbor[1] - ghostOffsetStart[1] + jghost;
710: const PetscInt eprNeighbor = nNeighbor[0]*stag->entriesPerElement + (nextToDummyEnd[0] ? entriesPerEdge : 0);
711: for (i=0; i<ghostOffsetEnd[0]; ++i) {
712: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
713: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + d;
714: }
715: }
716: } else if (dummyEnd[0]) {
717: /* Down right partial dummy elements, living on the *down* rank */
718: const PetscInt neighbor = 1;
719: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
720: const PetscInt * const nNeighbor = nNeighbors[neighbor];
721: const PetscInt j = nNeighbor[1] - ghostOffsetStart[1] + jghost;
722: const PetscInt eprNeighbor = entriesPerElementRow; /* same as here */
723: PetscInt dGlobal;
724: i = nNeighbor[0];
725: for (d=0,dGlobal=0; d<stag->dof[0]; ++d, ++dGlobal, ++countAll) {
726: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + dGlobal;
727: }
728: for (; d<stag->dof[0] + stag->dof[1]; ++d, ++countAll) {
729: idxGlobalAll[countAll] = -1; /* dummy down edge point */
730: }
731: for (; d<stag->dof[0] + 2*stag->dof[1]; ++d, ++dGlobal, ++countAll) {
732: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + dGlobal;
733: }
734: for (; d<stag->entriesPerElement; ++d, ++countAll) {
735: idxGlobalAll[countAll] = -1; /* dummy element point */
736: }
737: ++i;
738: for (; i<nNeighbor[0]+ghostOffsetEnd[0]; ++i) {
739: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
740: idxGlobalAll[countAll] = -1;
741: }
742: }
743: } else {
744: /* Down Right dummies */
745: for (ighost=0; ighost<ghostOffsetEnd[0]; ++ighost) {
746: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
747: idxGlobalAll[countAll] = -1;
748: }
749: }
750: }
751: }
752: } else {
753: /* Down dummies row */
754: for (jghost=0; jghost<ghostOffsetStart[1]; ++jghost) {
755: for (ighost=0; ighost<stag->nGhost[0]; ++ighost) {
756: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
757: idxGlobalAll[countAll] = -1;
758: }
759: }
760: }
761: }
763: /* Loop over rows 2/3 : center */
764: for (j=0; j<stag->n[1]; ++j) {
765: /* Loop over columns 1/3 : left */
766: if (!dummyStart[0]) {
767: const PetscInt neighbor = 3;
768: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
769: const PetscInt * const nNeighbor = nNeighbors[neighbor];
770: const PetscInt eprNeighbor = nNeighbor[0] * stag->entriesPerElement;
771: for (i=nNeighbor[0]-ghostOffsetStart[0]; i<nNeighbor[0]; ++i) {
772: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
773: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + d;
774: }
775: }
776: } else {
777: /* (Middle) Left dummies */
778: for (ighost=0; ighost < ghostOffsetStart[0]; ++ighost) {
779: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
780: idxGlobalAll[countAll] = -1;
781: }
782: }
783: }
785: /* Loop over columns 2/3 : here (the "neighbor" is ourselves, here) */
786: {
787: const PetscInt neighbor = 4;
788: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
789: const PetscInt eprNeighbor = entriesPerElementRow; /* same as here (obviously) */
790: for (i=0; i<stag->n[0]; ++i) {
791: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
792: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + d;
793: }
794: }
795: }
797: /* Loop over columns 3/3 : right */
798: if (!dummyEnd[0]) {
799: const PetscInt neighbor = 5;
800: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
801: const PetscInt * const nNeighbor = nNeighbors[neighbor];
802: const PetscInt eprNeighbor = nNeighbor[0]*stag->entriesPerElement + (nextToDummyEnd[0] ? entriesPerEdge : 0);
803: for (i=0; i<ghostOffsetEnd[0]; ++i) {
804: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
805: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + d;
806: }
807: }
808: } else {
809: /* -1's for right layer of partial dummies, living on *this* rank */
810: const PetscInt neighbor = 4;
811: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
812: const PetscInt * const nNeighbor = nNeighbors[neighbor];
813: const PetscInt eprNeighbor = entriesPerElementRow; /* same as here (obviously) */
814: PetscInt dGlobal;
815: i = nNeighbor[0];
816: for (d=0,dGlobal=0; d<stag->dof[0]; ++d, ++dGlobal, ++countAll) {
817: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + dGlobal;
818: }
819: for (; d<stag->dof[0] + stag->dof[1]; ++d, ++countAll) {
820: idxGlobalAll[countAll] = -1; /* dummy down edge point */
821: }
822: for (; d<stag->dof[0] + 2*stag->dof[1]; ++d, ++dGlobal, ++countAll) {
823: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + dGlobal;
824: }
825: for (; d<stag->entriesPerElement; ++d, ++countAll) {
826: idxGlobalAll[countAll] = -1; /* dummy element point */
827: }
828: ++i;
829: for (; i<nNeighbor[0]+ghostOffsetEnd[0]; ++i) {
830: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
831: idxGlobalAll[countAll] = -1;
832: }
833: }
834: }
835: }
837: /* Loop over rows 3/3 : up */
838: if (!dummyEnd[1]) {
839: for (j=0; j<ghostOffsetEnd[1]; ++j) {
841: /* Loop over columns 1/3 : up left */
842: if (!star && !dummyStart[0]) {
843: const PetscInt neighbor = 6;
844: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
845: const PetscInt * const nNeighbor = nNeighbors[neighbor];
846: const PetscInt eprNeighbor = nNeighbor[0] * stag->entriesPerElement;
847: for (i=nNeighbor[0]-ghostOffsetStart[0]; i<nNeighbor[0]; ++i) {
848: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
849: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + d;
850: }
851: }
852: } else {
853: /* Up Left dummies */
854: for (ighost=0; ighost<ghostOffsetStart[0]; ++ighost) {
855: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
856: idxGlobalAll[countAll] = -1;
857: }
858: }
859: }
861: /* Loop over columns 2/3 : up */
862: {
863: const PetscInt neighbor = 7;
864: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
865: const PetscInt * const nNeighbor = nNeighbors[neighbor];
866: const PetscInt eprNeighbor = entriesPerElementRow; /* Same as here */
867: for (i=0; i<nNeighbor[0]; ++i) {
868: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
869: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + d;
870: }
871: }
872: }
874: /* Loop over columns 3/3 : up right */
875: if (!star && !dummyEnd[0]) {
876: const PetscInt neighbor = 8;
877: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
878: const PetscInt * const nNeighbor = nNeighbors[neighbor];
879: const PetscInt eprNeighbor = nNeighbor[0]*stag->entriesPerElement + (nextToDummyEnd[0] ? entriesPerEdge : 0);
880: for (i=0; i<ghostOffsetEnd[0]; ++i) {
881: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
882: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + d;
883: }
884: }
885: } else if (dummyEnd[0]) {
886: /* -1's for right layer of partial dummies, living on rank above */
887: const PetscInt neighbor = 7;
888: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
889: const PetscInt * const nNeighbor = nNeighbors[neighbor];
890: const PetscInt eprNeighbor = entriesPerElementRow; /* Same as here */
891: PetscInt dGlobal;
892: i = nNeighbor[0];
893: for (d=0,dGlobal=0; d<stag->dof[0]; ++d, ++dGlobal, ++countAll) {
894: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + dGlobal;
895: }
896: for (; d<stag->dof[0] + stag->dof[1]; ++d, ++countAll) {
897: idxGlobalAll[countAll] = -1; /* dummy down edge point */
898: }
899: for (; d<stag->dof[0] + 2*stag->dof[1]; ++d, ++dGlobal, ++countAll) {
900: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*stag->entriesPerElement + dGlobal;
901: }
902: for (; d<stag->entriesPerElement; ++d, ++countAll) {
903: idxGlobalAll[countAll] = -1; /* dummy element point */
904: }
905: ++i;
906: for (; i<nNeighbor[0]+ghostOffsetEnd[0]; ++i) {
907: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
908: idxGlobalAll[countAll] = -1;
909: }
910: }
911: } else {
912: /* Up Right dummies */
913: for (ighost=0; ighost<ghostOffsetEnd[0]; ++ighost) {
914: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
915: idxGlobalAll[countAll] = -1;
916: }
917: }
918: }
919: }
920: } else {
921: j = stag->n[1];
922: /* Top layer of partial dummies */
924: /* up left partial dummies layer : Loop over columns 1/3 : living on *left* neighbor */
925: if (!dummyStart[0]) {
926: const PetscInt neighbor = 3;
927: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
928: const PetscInt * const nNeighbor = nNeighbors[neighbor];
929: const PetscInt eprNeighbor = nNeighbor[0] * stag->entriesPerElement;
930: for (i=nNeighbor[0]-ghostOffsetStart[0]; i<nNeighbor[0]; ++i) {
931: for (d=0; d<stag->dof[0] + stag->dof[1]; ++d, ++countAll) {
932: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*entriesPerEdge + d; /* Note entriesPerEdge here */
933: }
934: for (; d<stag->entriesPerElement; ++d, ++countAll) {
935: idxGlobalAll[countAll] = -1; /* dummy left edge and element points */
936: }
937: }
938: } else {
939: for (ighost=0; ighost<ghostOffsetStart[0]; ++ighost) {
940: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
941: idxGlobalAll[countAll] = -1;
942: }
943: }
944: }
946: /* up partial dummies layer : Loop over columns 2/3 : living on *this* rank */
947: {
948: const PetscInt neighbor = 4;
949: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
950: const PetscInt eprNeighbor = entriesPerElementRow; /* same as here (obviously) */
951: for (i=0; i<stag->n[0]; ++i) {
952: for (d=0; d<stag->dof[0] + stag->dof[1]; ++d, ++countAll) {
953: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*entriesPerEdge + d; /* Note entriesPerEdge here */
954: }
955: for (; d<stag->entriesPerElement; ++d, ++countAll) {
956: idxGlobalAll[countAll] = -1; /* dummy left edge and element points */
957: }
958: }
959: }
961: if (!dummyEnd[0]) {
962: /* up right partial dummies layer : Loop over columns 3/3 : living on *right* neighbor */
963: const PetscInt neighbor = 5;
964: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
965: const PetscInt * const nNeighbor = nNeighbors[neighbor];
966: const PetscInt eprNeighbor = nNeighbor[0]*stag->entriesPerElement + (nextToDummyEnd[0] ? entriesPerEdge : 0);
967: for (i = 0; i<ghostOffsetEnd[0]; ++i) {
968: for (d=0; d<stag->dof[0] + stag->dof[1]; ++d, ++countAll) {
969: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*entriesPerEdge + d; /* Note entriesPerEdge here */
970: }
971: for (; d<stag->entriesPerElement; ++d, ++countAll) {
972: idxGlobalAll[countAll] = -1; /* dummy left edge and element points */
973: }
974: }
975: } else {
976: /* Top partial dummies layer : Loop over columns 3/3 : right, living *here* */
977: const PetscInt neighbor = 4;
978: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
979: const PetscInt eprNeighbor = entriesPerElementRow; /* same as here (obviously) */
980: i = stag->n[0];
981: for (d=0; d<stag->dof[0]; ++d, ++countAll) { /* Note just the vertex here */
982: idxGlobalAll[countAll] = globalOffset + j*eprNeighbor + i*entriesPerEdge + d; /* Note entriesPerEdge here */
983: }
984: for (; d<stag->entriesPerElement; ++d, ++countAll) {
985: idxGlobalAll[countAll] = -1; /* dummy bottom edge, left edge and element points */
986: }
987: ++i;
988: for (; i<stag->n[0] + ghostOffsetEnd[0]; ++i) {
989: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
990: idxGlobalAll[countAll] = -1;
991: }
992: }
993: }
994: ++j;
995: /* Additional top dummy layers */
996: for (; j<stag->n[1]+ghostOffsetEnd[1]; ++j) {
997: for (ighost=0; ighost<stag->nGhost[0]; ++ighost){
998: for (d=0; d<stag->entriesPerElement; ++d, ++countAll) {
999: idxGlobalAll[countAll] = -1;
1000: }
1001: }
1002: }
1003: }
1005: /* Create local-to-global map (in local ordering, includes maps to -1 for dummy points) */
1006: ISLocalToGlobalMappingCreate(comm,1,stag->entriesGhost,idxGlobalAll,PETSC_OWN_POINTER,&dm->ltogmap);
1007: PetscLogObjectParent((PetscObject)dm,(PetscObject)dm->ltogmap);
1008: }
1010: /* In special cases, create a dedicated injective local-to-global map */
1011: if ((stag->boundaryType[0] == DM_BOUNDARY_PERIODIC && stag->nRanks[0] == 1) ||
1012: (stag->boundaryType[1] == DM_BOUNDARY_PERIODIC && stag->nRanks[1] == 1)) {
1013: DMStagPopulateLocalToGlobalInjective(dm);
1014: }
1016: /* Free global offsets */
1017: PetscFree(globalOffsets);
1019: /* Precompute location offsets */
1020: DMStagComputeLocationOffsets_2d(dm);
1022: /* View from Options */
1023: DMViewFromOptions(dm,NULL,"-dm_view");
1025: return(0);
1026: }
1028: /* adapted from da2.c */
1029: static PetscErrorCode DMStagSetUpBuildRankGrid_2d(DM dm)
1030: {
1031: PetscErrorCode ierr;
1032: DM_Stag * const stag = (DM_Stag*)dm->data;
1033: PetscInt m,n;
1034: PetscMPIInt rank,size;
1035: const PetscInt M = stag->N[0];
1036: const PetscInt N = stag->N[1];
1039: MPI_Comm_size(PetscObjectComm((PetscObject)dm),&size);
1040: MPI_Comm_rank(PetscObjectComm((PetscObject)dm),&rank);
1041: m = stag->nRanks[0];
1042: n = stag->nRanks[1];
1043: if (m != PETSC_DECIDE) {
1044: if (m < 1) SETERRQ1(PetscObjectComm((PetscObject)dm),PETSC_ERR_ARG_OUTOFRANGE,"Non-positive number of ranks in X direction: %D",m);
1045: else if (m > size) SETERRQ2(PetscObjectComm((PetscObject)dm),PETSC_ERR_ARG_OUTOFRANGE,"Too many ranks in X direction: %D %d",m,size);
1046: }
1047: if (n != PETSC_DECIDE) {
1048: if (n < 1) SETERRQ1(PetscObjectComm((PetscObject)dm),PETSC_ERR_ARG_OUTOFRANGE,"Non-positive number of ranks in Y direction: %D",n);
1049: else if (n > size) SETERRQ2(PetscObjectComm((PetscObject)dm),PETSC_ERR_ARG_OUTOFRANGE,"Too many ranks in Y direction: %D %d",n,size);
1050: }
1051: if (m == PETSC_DECIDE || n == PETSC_DECIDE) {
1052: if (n != PETSC_DECIDE) {
1053: m = size/n;
1054: } else if (m != PETSC_DECIDE) {
1055: n = size/m;
1056: } else {
1057: /* try for squarish distribution */
1058: m = (PetscInt)(0.5 + PetscSqrtReal(((PetscReal)M)*((PetscReal)size)/((PetscReal)N)));
1059: if (!m) m = 1;
1060: while (m > 0) {
1061: n = size/m;
1062: if (m*n == size) break;
1063: m--;
1064: }
1065: if (M > N && m < n) {PetscInt _m = m; m = n; n = _m;}
1066: }
1067: if (m*n != size) SETERRQ(PetscObjectComm((PetscObject)dm),PETSC_ERR_PLIB,"Unable to create partition, check the size of the communicator and input m and n ");
1068: } else if (m*n != size) SETERRQ2(PetscObjectComm((PetscObject)dm),PETSC_ERR_ARG_OUTOFRANGE,"Given Bad partition. Product of sizes (%D) does not equal communicator size (%d)",m*n,size);
1069: if (M < m) SETERRQ2(PetscObjectComm((PetscObject)dm),PETSC_ERR_ARG_OUTOFRANGE,"Partition in x direction is too fine! %D %D",M,m);
1070: if (N < n) SETERRQ2(PetscObjectComm((PetscObject)dm),PETSC_ERR_ARG_OUTOFRANGE,"Partition in y direction is too fine! %D %D",N,n);
1071: stag->nRanks[0] = m;
1072: stag->nRanks[1] = n;
1073: return(0);
1074: }
1076: static PetscErrorCode DMStagSetUpBuildNeighbors_2d(DM dm)
1077: {
1078: PetscErrorCode ierr;
1079: DM_Stag * const stag = (DM_Stag*)dm->data;
1080: PetscInt d,i;
1081: PetscBool per[2],first[2],last[2];
1082: PetscInt neighborRank[9][2],r[2],n[2];
1083: const PetscInt dim = 2;
1086: for (d=0; d<dim; ++d) if (stag->boundaryType[d] != DM_BOUNDARY_NONE && stag->boundaryType[d] != DM_BOUNDARY_PERIODIC && stag->boundaryType[d] != DM_BOUNDARY_GHOSTED) SETERRQ1(PETSC_COMM_WORLD,PETSC_ERR_SUP,"Neighbor determination not implemented for %s",DMBoundaryTypes[stag->boundaryType[d]]);
1088: /* Assemble some convenience variables */
1089: for (d=0; d<dim; ++d) {
1090: per[d] = (PetscBool)(stag->boundaryType[d] == DM_BOUNDARY_PERIODIC);
1091: first[d] = stag->firstRank[d];
1092: last[d] = stag->lastRank[d];
1093: r[d] = stag->rank[d];
1094: n[d] = stag->nRanks[d];
1095: }
1097: /* First, compute the position in the rank grid for all neighbors */
1098: neighborRank[0][0] = first[0] ? (per[0] ? n[0]-1 : -1) : r[0] - 1; /* left down */
1099: neighborRank[0][1] = first[1] ? (per[1] ? n[1]-1 : -1) : r[1] - 1;
1101: neighborRank[1][0] = r[0] ; /* down */
1102: neighborRank[1][1] = first[1] ? (per[1] ? n[1]-1 : -1) : r[1] - 1;
1104: neighborRank[2][0] = last[0] ? (per[0] ? 0 : -1) : r[0] + 1; /* right down */
1105: neighborRank[2][1] = first[1] ? (per[1] ? n[1]-1 : -1) : r[1] - 1;
1107: neighborRank[3][0] = first[0] ? (per[0] ? n[0]-1 : -1) : r[0] - 1; /* left */
1108: neighborRank[3][1] = r[1] ;
1110: neighborRank[4][0] = r[0] ; /* */
1111: neighborRank[4][1] = r[1] ;
1113: neighborRank[5][0] = last[0] ? (per[0] ? 0 : -1) : r[0] + 1; /* right */
1114: neighborRank[5][1] = r[1] ;
1116: neighborRank[6][0] = first[0] ? (per[0] ? n[0]-1 : -1) : r[0] - 1; /* left up */
1117: neighborRank[6][1] = last[1] ? (per[1] ? 0 : -1) : r[1] + 1;
1119: neighborRank[7][0] = r[0] ; /* up */
1120: neighborRank[7][1] = last[1] ? (per[1] ? 0 : -1) : r[1] + 1;
1122: neighborRank[8][0] = last[0] ? (per[0] ? 0 : -1) : r[0] + 1; /* right up */
1123: neighborRank[8][1] = last[1] ? (per[1] ? 0 : -1) : r[1] + 1;
1125: /* Then, compute the rank of each in the linear ordering */
1126: PetscMalloc1(9,&stag->neighbors);
1127: for (i=0; i<9; ++i){
1128: if (neighborRank[i][0] >= 0 && neighborRank[i][1] >=0) {
1129: stag->neighbors[i] = neighborRank[i][0] + n[0]*neighborRank[i][1];
1130: } else {
1131: stag->neighbors[i] = -1;
1132: }
1133: }
1135: return(0);
1136: }
1138: static PetscErrorCode DMStagSetUpBuildGlobalOffsets_2d(DM dm,PetscInt **pGlobalOffsets)
1139: {
1140: PetscErrorCode ierr;
1141: const DM_Stag * const stag = (DM_Stag*)dm->data;
1142: PetscInt *globalOffsets;
1143: PetscInt i,j,d,entriesPerEdge,count;
1144: PetscMPIInt size;
1145: PetscBool extra[2];
1148: MPI_Comm_size(PetscObjectComm((PetscObject)dm),&size);
1149: for (d=0; d<2; ++d) extra[d] = (PetscBool)(stag->boundaryType[d] != DM_BOUNDARY_PERIODIC); /* Extra points in global rep */
1150: entriesPerEdge = stag->dof[0] + stag->dof[1];
1151: PetscMalloc1(size,pGlobalOffsets);
1152: globalOffsets = *pGlobalOffsets;
1153: globalOffsets[0] = 0;
1154: count = 1; /* note the count is offset by 1 here. We add the size of the previous rank */
1155: for (j=0; j<stag->nRanks[1]-1; ++j) {
1156: const PetscInt nnj = stag->l[1][j];
1157: for (i=0; i<stag->nRanks[0]-1; ++i) {
1158: const PetscInt nni = stag->l[0][i];
1159: globalOffsets[count] = globalOffsets[count-1] + nnj*nni*stag->entriesPerElement; /* No right/top/front boundaries */
1160: ++count;
1161: }
1162: {
1163: /* i = stag->nRanks[0]-1; */
1164: const PetscInt nni = stag->l[0][i];
1165: globalOffsets[count] = globalOffsets[count-1] + nnj*nni*stag->entriesPerElement
1166: + (extra[0] ? nnj*entriesPerEdge : 0); /* Extra edges on the right */
1167: ++count;
1168: }
1169: }
1170: {
1171: /* j = stag->nRanks[1]-1; */
1172: const PetscInt nnj = stag->l[1][j];
1173: for (i=0; i<stag->nRanks[0]-1; ++i) {
1174: const PetscInt nni = stag->l[0][i];
1175: globalOffsets[count] = globalOffsets[count-1] + nni*nnj*stag->entriesPerElement
1176: + (extra[1] ? nni*entriesPerEdge : 0); /* Extra edges on the top */
1177: ++count;
1178: }
1179: /* Don't need to compute entries in last element */
1180: }
1181: return(0);
1182: }
1184: static PetscErrorCode DMStagComputeLocationOffsets_2d(DM dm)
1185: {
1186: PetscErrorCode ierr;
1187: DM_Stag * const stag = (DM_Stag*)dm->data;
1188: const PetscInt epe = stag->entriesPerElement;
1189: const PetscInt epr = stag->nGhost[0]*epe;
1192: PetscMalloc1(DMSTAG_NUMBER_LOCATIONS,&stag->locationOffsets);
1193: stag->locationOffsets[DMSTAG_DOWN_LEFT] = 0;
1194: stag->locationOffsets[DMSTAG_DOWN] = stag->locationOffsets[DMSTAG_DOWN_LEFT] + stag->dof[0];
1195: stag->locationOffsets[DMSTAG_DOWN_RIGHT] = stag->locationOffsets[DMSTAG_DOWN_LEFT] + epe;
1196: stag->locationOffsets[DMSTAG_LEFT] = stag->locationOffsets[DMSTAG_DOWN] + stag->dof[1];
1197: stag->locationOffsets[DMSTAG_ELEMENT] = stag->locationOffsets[DMSTAG_LEFT] + stag->dof[1];
1198: stag->locationOffsets[DMSTAG_RIGHT] = stag->locationOffsets[DMSTAG_LEFT] + epe;
1199: stag->locationOffsets[DMSTAG_UP_LEFT] = stag->locationOffsets[DMSTAG_DOWN_LEFT] + epr;
1200: stag->locationOffsets[DMSTAG_UP] = stag->locationOffsets[DMSTAG_DOWN] + epr;
1201: stag->locationOffsets[DMSTAG_UP_RIGHT] = stag->locationOffsets[DMSTAG_UP_LEFT] + epe;
1202: return(0);
1203: }
1205: PETSC_INTERN PetscErrorCode DMStagPopulateLocalToGlobalInjective_2d(DM dm)
1206: {
1207: PetscErrorCode ierr;
1208: DM_Stag * const stag = (DM_Stag*)dm->data;
1209: PetscInt *idxLocal,*idxGlobal,*globalOffsetsRecomputed;
1210: const PetscInt *globalOffsets;
1211: PetscInt i,j,d,count,entriesPerCorner,entriesPerEdge,entriesPerElementRowGhost,entriesPerElementRow,ghostOffsetStart[2];
1212: IS isLocal,isGlobal;
1213: PetscBool dummyEnd[2];
1216: DMStagSetUpBuildGlobalOffsets_2d(dm,&globalOffsetsRecomputed); /* note that we don't actually use all of these. An available optimization is to pass them, when available */
1217: globalOffsets = globalOffsetsRecomputed;
1218: PetscMalloc1(stag->entries,&idxLocal);
1219: PetscMalloc1(stag->entries,&idxGlobal);
1220: for (d=0; d<2; ++d) dummyEnd[d] = (PetscBool)(stag->lastRank[d] && stag->boundaryType[d] != DM_BOUNDARY_PERIODIC);
1221: entriesPerCorner = stag->dof[0];
1222: entriesPerEdge = stag->dof[0] + stag->dof[1];
1223: entriesPerElementRow = stag->n[0] *stag->entriesPerElement + (dummyEnd[0] ? entriesPerEdge : 0);
1224: entriesPerElementRowGhost = stag->nGhost[0]*stag->entriesPerElement;
1225: count = 0;
1226: for (d=0; d<2; ++d) ghostOffsetStart[d] = stag->start[d] - stag->startGhost[d];
1227: {
1228: const PetscInt neighbor = 4;
1229: const PetscInt globalOffset = globalOffsets[stag->neighbors[neighbor]];
1230: for (j=0; j<stag->n[1]; ++j) {
1231: const PetscInt jghost = j + ghostOffsetStart[1];
1232: for (i=0; i<stag->n[0]; ++i) {
1233: const PetscInt ighost = i + ghostOffsetStart[0];
1234: for (d=0; d<stag->entriesPerElement; ++d, ++count) {
1235: idxGlobal[count] = globalOffset + j *entriesPerElementRow + i *stag->entriesPerElement + d;
1236: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
1237: }
1238: }
1239: if (dummyEnd[0]) {
1240: const PetscInt ighost = i + ghostOffsetStart[0];
1241: i = stag->n[0];
1242: for (d=0; d<stag->dof[0]; ++d, ++count) { /* vertex first */
1243: idxGlobal[count] = globalOffset + j *entriesPerElementRow + i *stag->entriesPerElement + d;
1244: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
1245: }
1246: for (d=0; d<stag->dof[1]; ++d, ++count) { /* then left ege (skipping bottom edge) */
1247: idxGlobal[count] = globalOffset + j *entriesPerElementRow + i *stag->entriesPerElement + stag->dof[0] + d;
1248: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + stag->dof[0] + stag->dof[1] + d;
1249: }
1250: }
1251: }
1252: if (dummyEnd[1]) {
1253: const PetscInt jghost = j + ghostOffsetStart[1];
1254: j = stag->n[1];
1255: for (i=0; i<stag->n[0]; ++i) {
1256: const PetscInt ighost = i + ghostOffsetStart[0];
1257: for (d=0; d<entriesPerEdge; ++d, ++count) { /* vertex and bottom edge (which are the first entries) */
1258: idxGlobal[count] = globalOffset + j *entriesPerElementRow + i*entriesPerEdge + d; /* note i increment by entriesPerEdge */
1259: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
1260: }
1261: }
1262: if (dummyEnd[0]) {
1263: const PetscInt ighost = i + ghostOffsetStart[0];
1264: i = stag->n[0];
1265: for (d=0; d<entriesPerCorner; ++d, ++count) { /* vertex only */
1266: idxGlobal[count] = globalOffset + j *entriesPerElementRow + i *entriesPerEdge + d; /* note i increment by entriesPerEdge */
1267: idxLocal[count] = jghost*entriesPerElementRowGhost + ighost*stag->entriesPerElement + d;
1268: }
1269: }
1270: }
1271: }
1272: ISCreateGeneral(PetscObjectComm((PetscObject)dm),stag->entries,idxLocal,PETSC_OWN_POINTER,&isLocal);
1273: ISCreateGeneral(PetscObjectComm((PetscObject)dm),stag->entries,idxGlobal,PETSC_OWN_POINTER,&isGlobal);
1274: {
1275: Vec local,global;
1276: VecCreateMPIWithArray(PetscObjectComm((PetscObject)dm),1,stag->entries,PETSC_DECIDE,NULL,&global);
1277: VecCreateSeqWithArray(PETSC_COMM_SELF,stag->entriesPerElement,stag->entriesGhost,NULL,&local);
1278: VecScatterCreate(local,isLocal,global,isGlobal,&stag->ltog_injective);
1279: VecDestroy(&global);
1280: VecDestroy(&local);
1281: }
1282: ISDestroy(&isLocal);
1283: ISDestroy(&isGlobal);
1284: if (globalOffsetsRecomputed) {
1285: PetscFree(globalOffsetsRecomputed);
1286: }
1287: return(0);
1288: }