Actual source code: vecimpl.h

petsc-3.7.6 2017-04-24
Report Typos and Errors
  2: /*
  3:    This private file should not be included in users' code.
  4:    Defines the fields shared by all vector implementations.

  6: */

  8: #ifndef __VECIMPL_H

 11: #include <petscvec.h>
 12: #include <petsc/private/petscimpl.h>
 13: #include <petscviewer.h>

 15: PETSC_EXTERN PetscBool VecRegisterAllCalled;
 16: PETSC_EXTERN PetscErrorCode VecRegisterAll(void);

 18: /* ----------------------------------------------------------------------------*/

 20: typedef struct _VecOps *VecOps;
 21: struct _VecOps {
 22:   PetscErrorCode (*duplicate)(Vec,Vec*);         /* get single vector */
 23:   PetscErrorCode (*duplicatevecs)(Vec,PetscInt,Vec**);     /* get array of vectors */
 24:   PetscErrorCode (*destroyvecs)(PetscInt,Vec[]);           /* free array of vectors */
 25:   PetscErrorCode (*dot)(Vec,Vec,PetscScalar*);             /* z = x^H * y */
 26:   PetscErrorCode (*mdot)(Vec,PetscInt,const Vec[],PetscScalar*); /* z[j] = x dot y[j] */
 27:   PetscErrorCode (*norm)(Vec,NormType,PetscReal*);        /* z = sqrt(x^H * x) */
 28:   PetscErrorCode (*tdot)(Vec,Vec,PetscScalar*);             /* x'*y */
 29:   PetscErrorCode (*mtdot)(Vec,PetscInt,const Vec[],PetscScalar*);/* z[j] = x dot y[j] */
 30:   PetscErrorCode (*scale)(Vec,PetscScalar);                 /* x = alpha * x   */
 31:   PetscErrorCode (*copy)(Vec,Vec);                     /* y = x */
 32:   PetscErrorCode (*set)(Vec,PetscScalar);                        /* y = alpha  */
 33:   PetscErrorCode (*swap)(Vec,Vec);                               /* exchange x and y */
 34:   PetscErrorCode (*axpy)(Vec,PetscScalar,Vec);                   /* y = y + alpha * x */
 35:   PetscErrorCode (*axpby)(Vec,PetscScalar,PetscScalar,Vec);      /* y = alpha * x + beta * y*/
 36:   PetscErrorCode (*maxpy)(Vec,PetscInt,const PetscScalar*,Vec*); /* y = y + alpha[j] x[j] */
 37:   PetscErrorCode (*aypx)(Vec,PetscScalar,Vec);                   /* y = x + alpha * y */
 38:   PetscErrorCode (*waxpy)(Vec,PetscScalar,Vec,Vec);         /* w = y + alpha * x */
 39:   PetscErrorCode (*axpbypcz)(Vec,PetscScalar,PetscScalar,PetscScalar,Vec,Vec);   /* z = alpha * x + beta *y + gamma *z*/
 40:   PetscErrorCode (*pointwisemult)(Vec,Vec,Vec);        /* w = x .* y */
 41:   PetscErrorCode (*pointwisedivide)(Vec,Vec,Vec);      /* w = x ./ y */
 42:   PetscErrorCode (*setvalues)(Vec,PetscInt,const PetscInt[],const PetscScalar[],InsertMode);
 43:   PetscErrorCode (*assemblybegin)(Vec);                /* start global assembly */
 44:   PetscErrorCode (*assemblyend)(Vec);                  /* end global assembly */
 45:   PetscErrorCode (*getarray)(Vec,PetscScalar**);            /* get data array */
 46:   PetscErrorCode (*getsize)(Vec,PetscInt*);
 47:   PetscErrorCode (*getlocalsize)(Vec,PetscInt*);
 48:   PetscErrorCode (*restorearray)(Vec,PetscScalar**);        /* restore data array */
 49:   PetscErrorCode (*max)(Vec,PetscInt*,PetscReal*);      /* z = max(x); idx=index of max(x) */
 50:   PetscErrorCode (*min)(Vec,PetscInt*,PetscReal*);      /* z = min(x); idx=index of min(x) */
 51:   PetscErrorCode (*setrandom)(Vec,PetscRandom);         /* set y[j] = random numbers */
 52:   PetscErrorCode (*setoption)(Vec,VecOption,PetscBool );
 53:   PetscErrorCode (*setvaluesblocked)(Vec,PetscInt,const PetscInt[],const PetscScalar[],InsertMode);
 54:   PetscErrorCode (*destroy)(Vec);
 55:   PetscErrorCode (*view)(Vec,PetscViewer);
 56:   PetscErrorCode (*placearray)(Vec,const PetscScalar*);     /* place data array */
 57:   PetscErrorCode (*replacearray)(Vec,const PetscScalar*);     /* replace data array */
 58:   PetscErrorCode (*dot_local)(Vec,Vec,PetscScalar*);
 59:   PetscErrorCode (*tdot_local)(Vec,Vec,PetscScalar*);
 60:   PetscErrorCode (*norm_local)(Vec,NormType,PetscReal*);
 61:   PetscErrorCode (*mdot_local)(Vec,PetscInt,const Vec[],PetscScalar*);
 62:   PetscErrorCode (*mtdot_local)(Vec,PetscInt,const Vec[],PetscScalar*);
 63:   PetscErrorCode (*load)(Vec,PetscViewer);
 64:   PetscErrorCode (*reciprocal)(Vec);
 65:   PetscErrorCode (*conjugate)(Vec);
 66:   PetscErrorCode (*setlocaltoglobalmapping)(Vec,ISLocalToGlobalMapping);
 67:   PetscErrorCode (*setvalueslocal)(Vec,PetscInt,const PetscInt *,const PetscScalar *,InsertMode);
 68:   PetscErrorCode (*resetarray)(Vec);      /* vector points to its original array, i.e. undoes any VecPlaceArray() */
 69:   PetscErrorCode (*setfromoptions)(PetscOptionItems*,Vec);
 70:   PetscErrorCode (*maxpointwisedivide)(Vec,Vec,PetscReal*);      /* m = max abs(x ./ y) */
 71:   PetscErrorCode (*pointwisemax)(Vec,Vec,Vec);
 72:   PetscErrorCode (*pointwisemaxabs)(Vec,Vec,Vec);
 73:   PetscErrorCode (*pointwisemin)(Vec,Vec,Vec);
 74:   PetscErrorCode (*getvalues)(Vec,PetscInt,const PetscInt[],PetscScalar[]);
 75:   PetscErrorCode (*sqrt)(Vec);
 76:   PetscErrorCode (*abs)(Vec);
 77:   PetscErrorCode (*exp)(Vec);
 78:   PetscErrorCode (*log)(Vec);
 79:   PetscErrorCode (*shift)(Vec,PetscScalar);
 80:   PetscErrorCode (*create)(Vec);
 81:   PetscErrorCode (*stridegather)(Vec,PetscInt,Vec,InsertMode);
 82:   PetscErrorCode (*stridescatter)(Vec,PetscInt,Vec,InsertMode);
 83:   PetscErrorCode (*dotnorm2)(Vec,Vec,PetscScalar*,PetscScalar*);
 84:   PetscErrorCode (*getsubvector)(Vec,IS,Vec*);
 85:   PetscErrorCode (*restoresubvector)(Vec,IS,Vec*);
 86:   PetscErrorCode (*getarrayread)(Vec,const PetscScalar**);
 87:   PetscErrorCode (*restorearrayread)(Vec,const PetscScalar**);
 88:   PetscErrorCode (*stridesubsetgather)(Vec,PetscInt,const PetscInt[],const PetscInt[],Vec,InsertMode);
 89:   PetscErrorCode (*stridesubsetscatter)(Vec,PetscInt,const PetscInt[],const PetscInt[],Vec,InsertMode);
 90:   PetscErrorCode (*viewnative)(Vec,PetscViewer);
 91:   PetscErrorCode (*loadnative)(Vec,PetscViewer);
 92:   PetscErrorCode (*getlocalvector)(Vec,Vec);
 93:   PetscErrorCode (*restorelocalvector)(Vec,Vec);
 94:   PetscErrorCode (*getlocalvectorread)(Vec,Vec);
 95:   PetscErrorCode (*restorelocalvectorread)(Vec,Vec);
 96: };

 98: /*
 99:     The stash is used to temporarily store inserted vec values that
100:   belong to another processor. During the assembly phase the stashed
101:   values are moved to the correct processor and
102: */

104: typedef struct {
105:   PetscInt      nmax;                   /* maximum stash size */
106:   PetscInt      umax;                   /* max stash size user wants */
107:   PetscInt      oldnmax;                /* the nmax value used previously */
108:   PetscInt      n;                      /* stash size */
109:   PetscInt      bs;                     /* block size of the stash */
110:   PetscInt      reallocs;               /* preserve the no of mallocs invoked */
111:   PetscInt      *idx;                   /* global row numbers in stash */
112:   PetscScalar   *array;                 /* array to hold stashed values */
113:   /* The following variables are used for communication */
114:   MPI_Comm      comm;
115:   PetscMPIInt   size,rank;
116:   PetscMPIInt   tag1,tag2;
117:   MPI_Request   *send_waits;            /* array of send requests */
118:   MPI_Request   *recv_waits;            /* array of receive requests */
119:   MPI_Status    *send_status;           /* array of send status */
120:   PetscInt      nsends,nrecvs;          /* numbers of sends and receives */
121:   PetscScalar   *svalues,*rvalues;      /* sending and receiving data */
122:   PetscInt      *sindices,*rindices;
123:   PetscInt      rmax;                   /* maximum message length */
124:   PetscInt      *nprocs;                /* tmp data used both during scatterbegin and end */
125:   PetscInt      nprocessed;             /* number of messages already processed */
126:   PetscBool     donotstash;
127:   PetscBool     ignorenegidx;           /* ignore negative indices passed into VecSetValues/VetGetValues */
128:   InsertMode    insertmode;
129:   PetscInt      *bowners;
130: } VecStash;

132: struct _p_Vec {
133:   PETSCHEADER(struct _VecOps);
134:   PetscLayout            map;
135:   void                   *data;     /* implementation-specific data */
136:   PetscBool              array_gotten;
137:   VecStash               stash,bstash; /* used for storing off-proc values during assembly */
138:   PetscBool              petscnative;  /* means the ->data starts with VECHEADER and can use VecGetArrayFast()*/
139:   PetscInt               lock;   /* vector is locked to read only */
140: #if defined(PETSC_HAVE_CUSP)
141:   PetscCUSPFlag          valid_GPU_array;    /* indicates where the most recently modified vector data is (GPU or CPU) */
142:   void                   *spptr; /* if we're using CUSP, then this is the special pointer to the array on the GPU */
143: #elif defined(PETSC_HAVE_VIENNACL)
144:   PetscViennaCLFlag      valid_GPU_array;    /* indicates where the most recently modified vector data is (GPU or CPU) */
145:   void                   *spptr; /* if we're using ViennaCL, then this is the special pointer to the array on the GPU */
146: #elif defined(PETSC_HAVE_VECCUDA)
147:   PetscCUDAFlag          valid_GPU_array;    /* indicates where the most recently modified vector data is (GPU or CPU) */
148:   void                   *spptr; /* if we're using CUDA, then this is the special pointer to the array on the GPU */
149: #endif
150: };

152: PETSC_EXTERN PetscLogEvent VEC_View, VEC_Max, VEC_Min, VEC_DotBarrier, VEC_Dot, VEC_MDotBarrier, VEC_MDot, VEC_TDot, VEC_MTDot;
153: PETSC_EXTERN PetscLogEvent VEC_Norm, VEC_Normalize, VEC_Scale, VEC_Copy, VEC_Set, VEC_AXPY, VEC_AYPX, VEC_WAXPY, VEC_MAXPY;
154: PETSC_EXTERN PetscLogEvent VEC_AssemblyEnd, VEC_PointwiseMult, VEC_SetValues, VEC_Load, VEC_ScatterBarrier, VEC_ScatterBegin, VEC_ScatterEnd;
155: PETSC_EXTERN PetscLogEvent VEC_SetRandom, VEC_ReduceArithmetic, VEC_ReduceBarrier, VEC_ReduceCommunication;
156: PETSC_EXTERN PetscLogEvent VEC_ReduceBegin,VEC_ReduceEnd;
157: PETSC_EXTERN PetscLogEvent VEC_Swap, VEC_AssemblyBegin, VEC_NormBarrier, VEC_DotNormBarrier, VEC_DotNorm, VEC_AXPBYPCZ, VEC_Ops;
158: PETSC_EXTERN PetscLogEvent VEC_CUSPCopyToGPU, VEC_CUSPCopyFromGPU;
159: PETSC_EXTERN PetscLogEvent VEC_CUSPCopyToGPUSome, VEC_CUSPCopyFromGPUSome;
160: PETSC_EXTERN PetscLogEvent VEC_ViennaCLCopyToGPU,     VEC_ViennaCLCopyFromGPU;
161: PETSC_EXTERN PetscLogEvent VEC_CUDACopyToGPU, VEC_CUDACopyFromGPU;
162: PETSC_EXTERN PetscLogEvent VEC_CUDACopyToGPUSome, VEC_CUDACopyFromGPUSome;

164: PETSC_EXTERN PetscErrorCode VecView_Seq(Vec,PetscViewer);
165: #if defined(PETSC_HAVE_CUSP)
166: PETSC_EXTERN PetscErrorCode VecCUSPAllocateCheckHost(Vec v);
167: PETSC_EXTERN PetscErrorCode VecCUSPCopyFromGPU(Vec v);
168: #elif defined(PETSC_HAVE_VIENNACL)
169: PETSC_EXTERN PetscErrorCode VecViennaCLAllocateCheckHost(Vec v);
170: PETSC_EXTERN PetscErrorCode VecViennaCLCopyFromGPU(Vec v);
171: #elif defined(PETSC_HAVE_VECCUDA)
172: PETSC_EXTERN PetscErrorCode VecCUDAAllocateCheckHost(Vec v);
173: PETSC_EXTERN PetscErrorCode VecCUDACopyFromGPU(Vec v);
174: #endif


/*
     Common header shared by array based vectors,
   currently Vec_Seq and Vec_MPI

     array_allocated - if the array was allocated by PETSc this is its pointer
     unplacedarray   - if one called VecPlaceArray(), this is where it stashed the original
*/
#define VECHEADER               \
  PetscScalar *array;           \
  PetscScalar *array_allocated; \
  PetscScalar *unplacedarray;

186: /* Default obtain and release vectors; can be used by any implementation */
187: PETSC_INTERN PetscErrorCode VecDuplicateVecs_Default(Vec,PetscInt,Vec *[]);
188: PETSC_INTERN PetscErrorCode VecDestroyVecs_Default(PetscInt,Vec []);
189: PETSC_INTERN PetscErrorCode VecLoad_Binary(Vec, PetscViewer);
190: PETSC_EXTERN PetscErrorCode VecLoad_Default(Vec, PetscViewer);

192: PETSC_EXTERN PetscInt  NormIds[7];  /* map from NormType to IDs used to cache/retreive values of norms */

/* --------------------------------------------------------------------
   Defines the data structures used in the Vec Scatter operations
   -------------------------------------------------------------------- */

/* Tag stored first in every scatter context; enumerator order (and hence value) is kept as declared */
typedef enum {
  VEC_SCATTER_SEQ_GENERAL,
  VEC_SCATTER_SEQ_STRIDE,
  VEC_SCATTER_MPI_GENERAL,
  VEC_SCATTER_MPI_TOALL,
  VEC_SCATTER_MPI_TOONE
} VecScatterType;

202: #define VECSCATTER_IMPL_HEADER \
203:       VecScatterType type;

205: typedef struct {
206:   VECSCATTER_IMPL_HEADER
207: } VecScatter_Common;

209: /*
210:    These scatters are for the purely local case.
211: */
212: typedef struct {
213:   VECSCATTER_IMPL_HEADER
214:   PetscInt       n;                    /* number of components to scatter */
215:   PetscInt       *vslots;              /* locations of components */
216:   /*
217:        The next three fields are used in parallel scatters, they contain
218:        optimization in the special case that the "to" vector and the "from"
219:        vector are the same, so one only needs copy components that truly
220:        copies instead of just y[idx[i]] = y[jdx[i]] where idx[i] == jdx[i].
221:   */
222:   PetscBool      nonmatching_computed;
223:   PetscInt       n_nonmatching;        /* number of "from"s  != "to"s */
224:   PetscInt       *slots_nonmatching;   /* locations of "from"s  != "to"s */
225:   PetscBool      is_copy;
226:   PetscInt       copy_start;   /* local scatter is a copy starting at copy_start */
227:   PetscInt       copy_length;
228: } VecScatter_Seq_General;

230: typedef struct {
231:   VECSCATTER_IMPL_HEADER
232:   PetscInt       n;
233:   PetscInt       first;
234:   PetscInt       step;
235: } VecScatter_Seq_Stride;

237: /*
238:    This scatter is for a global vector copied (completely) to each processor (or all to one)
239: */
240: typedef struct {
241:   VECSCATTER_IMPL_HEADER
242:   PetscMPIInt    *count;        /* elements of vector on each processor */
243:   PetscMPIInt    *displx;
244:   PetscScalar    *work1;
245:   PetscScalar    *work2;
246: } VecScatter_MPI_ToAll;

248: /*
249:    This is the general parallel scatter
250: */
251: typedef struct {
252:   VECSCATTER_IMPL_HEADER
253:   PetscInt               n;        /* number of processors to send/receive */
254:   PetscInt               *starts;  /* starting point in indices and values for each proc*/
255:   PetscInt               *indices; /* list of all components sent or received */
256:   PetscMPIInt            *procs;   /* processors we are communicating with in scatter */
257:   MPI_Request            *requests,*rev_requests;
258:   PetscScalar            *values;  /* buffer for all sends or receives */
259:   VecScatter_Seq_General local;    /* any part that happens to be local */
260:   MPI_Status             *sstatus,*rstatus;
261:   PetscBool              use_readyreceiver;
262:   PetscInt               bs;
263:   PetscBool              sendfirst;
264:   PetscBool              contiq;
265:   /* for MPI_Alltoallv() approach */
266:   PetscBool              use_alltoallv;
267:   PetscMPIInt            *counts,*displs;
268:   /* for MPI_Alltoallw() approach */
269:   PetscBool              use_alltoallw;
270: #if defined(PETSC_HAVE_MPI_ALLTOALLW)
271:   PetscMPIInt            *wcounts,*wdispls;
272:   MPI_Datatype           *types;
273: #endif
274:   PetscBool              use_window;
275: #if defined(PETSC_HAVE_MPI_WIN_CREATE)
276:   MPI_Win                window;
277:   PetscInt               *winstarts;    /* displacements in the processes I am putting to */
278: #endif
279: } VecScatter_MPI_General;


282: PETSC_INTERN PetscErrorCode VecScatterGetTypes_Private(VecScatter,VecScatterType*,VecScatterType*);
283: PETSC_INTERN PetscErrorCode VecScatterIsSequential_Private(VecScatter_Common*,PetscBool*);

285: typedef struct _VecScatterOps *VecScatterOps;
286: struct _VecScatterOps {
287:   PetscErrorCode (*begin)(VecScatter,Vec,Vec,InsertMode,ScatterMode);
288:   PetscErrorCode (*end)(VecScatter,Vec,Vec,InsertMode,ScatterMode);
289:   PetscErrorCode (*copy)(VecScatter,VecScatter);
290:   PetscErrorCode (*destroy)(VecScatter);
291:   PetscErrorCode (*view)(VecScatter,PetscViewer);
292:   PetscErrorCode (*viewfromoptions)(VecScatter,const char prefix[],const char name[]);
293:   PetscErrorCode (*remap)(VecScatter,PetscInt *,PetscInt*);
294:   PetscErrorCode (*getmerged)(VecScatter,PetscBool *);
295: };

297: struct _p_VecScatter {
298:   PETSCHEADER(struct _VecScatterOps);
299:   PetscInt       to_n,from_n;
300:   PetscBool      inuse;                /* prevents corruption from mixing two scatters */
301:   PetscBool      beginandendtogether;  /* indicates that the scatter begin and end  function are called together, VecScatterEnd()
302:                                           is then treated as a nop */
303:   PetscBool      packtogether;         /* packs all the messages before sending, same with receive */
304:   PetscBool      reproduce;            /* always receive the ghost points in the same order of processes */
305:   void           *fromdata,*todata;
306:   void           *spptr;
307: };

309: PETSC_INTERN PetscErrorCode VecStashCreate_Private(MPI_Comm,PetscInt,VecStash*);
310: PETSC_INTERN PetscErrorCode VecStashDestroy_Private(VecStash*);
311: PETSC_INTERN PetscErrorCode VecStashExpand_Private(VecStash*,PetscInt);
312: PETSC_INTERN PetscErrorCode VecStashScatterEnd_Private(VecStash*);
313: PETSC_INTERN PetscErrorCode VecStashSetInitialSize_Private(VecStash*,PetscInt);
314: PETSC_INTERN PetscErrorCode VecStashGetInfo_Private(VecStash*,PetscInt*,PetscInt*);
315: PETSC_INTERN PetscErrorCode VecStashScatterBegin_Private(VecStash*,PetscInt*);
316: PETSC_INTERN PetscErrorCode VecStashScatterGetMesg_Private(VecStash*,PetscMPIInt*,PetscInt**,PetscScalar**,PetscInt*);
317: PETSC_INTERN PetscErrorCode VecStashSortCompress_Private(VecStash*);
318: PETSC_INTERN PetscErrorCode VecStashGetOwnerList_Private(VecStash*,PetscLayout,PetscMPIInt*,PetscMPIInt**);

320: /*
321:   VecStashValue_Private - inserts a single value into the stash.

323:   Input Parameters:
324:   stash  - the stash
325:   idx    - the global of the inserted value
326:   values - the value inserted
327: */
328: PETSC_STATIC_INLINE PetscErrorCode VecStashValue_Private(VecStash *stash,PetscInt row,PetscScalar value)
329: {
331:   /* Check and see if we have sufficient memory */
332:   if (((stash)->n + 1) > (stash)->nmax) {
333:     VecStashExpand_Private(stash,1);
334:   }
335:   (stash)->idx[(stash)->n]   = row;
336:   (stash)->array[(stash)->n] = value;
337:   (stash)->n++;
338:   return 0;
339: }

341: /*
342:   VecStashValuesBlocked_Private - inserts 1 block of values into the stash.

344:   Input Parameters:
345:   stash  - the stash
346:   idx    - the global block index
347:   values - the values inserted
348: */
349: PETSC_STATIC_INLINE PetscErrorCode VecStashValuesBlocked_Private(VecStash *stash,PetscInt row,PetscScalar *values)
350: {
351:   PetscInt       jj,stash_bs=(stash)->bs;
352:   PetscScalar    *array;
354:   if (((stash)->n+1) > (stash)->nmax) {
355:     VecStashExpand_Private(stash,1);
356:   }
357:   array = (stash)->array + stash_bs*(stash)->n;
358:   (stash)->idx[(stash)->n]   = row;
359:   for (jj=0; jj<stash_bs; jj++) { array[jj] = values[jj];}
360:   (stash)->n++;
361:   return 0;
362: }

364: PETSC_INTERN PetscErrorCode VecStrideGather_Default(Vec,PetscInt,Vec,InsertMode);
365: PETSC_INTERN PetscErrorCode VecStrideScatter_Default(Vec,PetscInt,Vec,InsertMode);
366: PETSC_INTERN PetscErrorCode VecReciprocal_Default(Vec);
367: PETSC_INTERN PetscErrorCode VecStrideSubSetGather_Default(Vec,PetscInt,const PetscInt[],const PetscInt[],Vec,InsertMode);
368: PETSC_INTERN PetscErrorCode VecStrideSubSetScatter_Default(Vec,PetscInt,const PetscInt[],const PetscInt[],Vec,InsertMode);

370: #if defined(PETSC_HAVE_MATLAB_ENGINE)
371: PETSC_EXTERN PetscErrorCode VecMatlabEnginePut_Default(PetscObject,void*);
372: PETSC_EXTERN PetscErrorCode VecMatlabEngineGet_Default(PetscObject,void*);
373: #endif

375: PETSC_EXTERN PetscErrorCode PetscSectionGetField_Internal(PetscSection, PetscSection, Vec, PetscInt, PetscInt, PetscInt, IS *, Vec *);
376: PETSC_EXTERN PetscErrorCode PetscSectionRestoreField_Internal(PetscSection, PetscSection, Vec, PetscInt, PetscInt, PetscInt, IS *, Vec *);

378: /* Reset __FUNCT__ in case the user does not define it themselves */

382: #endif