a01283_source.html

/*! @file ParabolicFunctionNC2Stage_GPU.cu
    @author Youngdae Kim
    @brief Evaluate the parabolic term using a 2-stage finite difference discretization.
*/

#include <basic_gpu.h>
#include <arrayfunctions_gpu.h>
#include <mpivars.h>
#include <hypar.h>

/*! Kernel for ParabolicFunctionNC2Stage_GPU() */
__global__
void ParabolicFunctionNC2Stage_kernel(
    int ngrid_points,
    int ghosts,
    int d1,
    int d2,
    int ndims,
    int nvars,
    const int *dim,
    const double *dxinv,
    const double *Deriv2,
    double *par
)
{
    int tx = threadIdx.x + (blockDim.x * blockIdx.x);
    if (tx < ngrid_points) {
        int p, v;
        int index[GPU_MAX_NDIMS];
        double dxinv1, dxinv2;

        _ArrayIndexnD_(ndims,tx,dim,index,0);
        _ArrayIndex1D_(ndims,dim,index,ghosts,p);
        _GetCoordinate_(d1,index[d1],dim,ghosts,dxinv,dxinv1);
        _GetCoordinate_(d2,index[d2],dim,ghosts,dxinv,dxinv2);
        for (v=0; v<nvars; v++) par[nvars*p+v] += (dxinv1*dxinv2 * Deriv2[nvars*p+v]);
    }

    return;
}

/*! Evaluate the parabolic term using a "1.5"-stage finite-difference spatial discretization:
    The parabolic term is assumed to be of the form:
    \f{equation}{
      {\bf P}\left({\bf u}\right) = \sum_{d1=0}^{D-1}\sum_{d2=0}^{D-1} \frac {\partial^2 h_{d1,d2}\left(\bf u\right)} {\partial x_{d1} \partial x_{d2}},
    \f}
    where \f$d1\f$ and \f$d2\f$ are spatial dimension indices, and \f$D\f$ is the total number of spatial dimensions (#HyPar::ndims). This term is
    discretized at a grid point as:
    \f{equation}{
      \left.{\bf P}\left({\bf u}\right)\right|_j = \sum_{d1=0}^{D-1} \sum_{d2=0}^{D-1} \frac { \mathcal{D}_{d1}\mathcal{D}_{d2} \left[ {\bf h}_{d1,d2} \right] } {\Delta x_{d1} \Delta x_{d2}},
    \f}
    where \f$\mathcal{D}\f$ denotes the finite-difference approximation to the first derivative. Each of the first derivative approximations are \f$\mathcal{D}_{d1}\f$ and \f$\mathcal{D}_{d2}\f$ are computed separately, and thus the cross-derivative is evaluated in two steps using #HyPar::FirstDerivativePar.

    \b Notes:
    + This form of the parabolic term \b does \b allow for cross-derivatives (\f$ d1 \ne d2 \f$).
    + A \f$n\f$-th order central approximation to the second derivative can be expressed as a
      conjugation of two \f$(n-1)\f$-th order approximations to the first
      derivative, one forward and one backward. Computing it this way avoids
      odd-even decoupling. Thus, where possible #HyPar::FirstDerivativePar should
      point to the function computing \f$(n-1)\f$-th order first derivative where \f$n\f$
      is the desired order. Currently, this is implemented only for \f$n=2\f$. For other values
      of \f$n\f$, the first derivative is also computed with a \f$n\f$-th order approximation.

    To use this form of the parabolic term:
    + specify \b "par_space_type" in solver.inp as \b "nonconservative-2stage" (#HyPar::spatial_type_par).
    + the physical model must specify \f${\bf h}_{d1,d2}\left({\bf u}\right)\f$ through #HyPar::HFunction.
*/
int ParabolicFunctionNC2Stage_GPU(
    double  *par, /*!< array to hold the computed parabolic term */
    double  *u,   /*!< solution */
    void    *s,   /*!< Solver object of type #HyPar */
    void    *m,   /*!< MPI object of type #MPIVariables */
    double  t     /*!< Current simulation time */
)
{
  HyPar         *solver = (HyPar*)        s;
  MPIVariables  *mpi    = (MPIVariables*) m;
  double        *Func   = solver->fluxC;
  double        *Deriv1 = solver->Deriv1;
  double        *Deriv2 = solver->Deriv2;
  int           d1, d2;
  _DECLARE_IERR_;

  int     ndims  = solver->ndims;
  int     nvars  = solver->nvars;
  int     ghosts = solver->ghosts;
  int     *dim   = solver->dim_local;
  int     size   = solver->npoints_local_wghosts;

  if (!solver->HFunction) return(0); /* zero parabolic terms */
  solver->count_par++;

  gpuArraySetValue(par, size*nvars, 0.0);

  int ngrid_points = 1; for (int i = 0; i < ndims; i++) ngrid_points *= dim[i];

  for (d1 = 0; d1 < ndims; d1++) {
    for (d2 = 0; d2 < ndims; d2++) {

      /* calculate the diffusion function */
      solver->HFunction(Func,u,d1,d2,solver,t);
      solver->FirstDerivativePar(Deriv1,Func  ,d1, 1,solver,mpi);
      MPIExchangeBoundariesnD(ndims,nvars,dim,ghosts,mpi,Deriv1);
      solver->FirstDerivativePar(Deriv2,Deriv1,d2,-1,solver,mpi);

      /* calculate the final term - second derivative of the diffusion function */
      int nblocks = (ngrid_points - 1) / GPU_THREADS_PER_BLOCK + 1;
      ParabolicFunctionNC2Stage_kernel<<<nblocks, GPU_THREADS_PER_BLOCK>>>(
          ghosts, d1, d2, ndims, nvars, ngrid_points,
          solver->gpu_dim_local, solver->gpu_dxinv, solver->Deriv2, par
      );

      /*
      done = 0; _ArraySetValue_(index,ndims,0);
      while (!done) {
        _ArrayIndex1D_(ndims,dim,index,ghosts,p);
        _GetCoordinate_(d1,index[d1],dim,ghosts,dxinv,dxinv1);
        _GetCoordinate_(d2,index[d2],dim,ghosts,dxinv,dxinv2);
        for (v=0; v<nvars; v++) par[nvars*p+v] += (dxinv1*dxinv2 * Deriv2[nvars*p+v]);
        _ArrayIncrementIndex_(ndims,dim,index,done);
      }
      */
    }
  }

  if (solver->flag_ib) _ArrayBlockMultiply_(par,solver->iblank,size,nvars);
  return(0);
}