Momentum Balance¶

The momentum balance is

\[\pder{u_i}{t} = P_i + A_i + D_{i1} + D_{i2} + D_{i3},\]

where \(P_i\) is the pressure-gradient term:

\[P_i \equiv - \dmompre{i},\]

and \(A_i\) is the sum of the advective terms:

\[A_i \equiv - \dmomadv{i}{1} - \dmomadv{i}{2} - \dmomadv{i}{3}.\]

\(D_{ij}\) is the diffusive term involving spatial differentiation in the \(j\)-th direction:

\[D_{ij} \equiv \dmomdif{j}{i} \,\, (\text{no summation over}\,j).\]

See the spatial discretization.

The temporal discretization for each Runge-Kutta iteration leads to

\[ \begin{align}\begin{aligned}\Delta u_i & = \gamma^k \Delta t P_i^k + \alpha^k \Delta t \left( A_i^{k } + D_{i1}^{k } + D_{i2}^{k } + D_{i3}^{k } \right) + \beta^k \Delta t \left( A_i^{k-1} + D_{i1}^{k-1} + D_{i2}^{k-1} + D_{i3}^{k-1} \right),\\u_i^* & = u_i^k + \Delta u_i,\end{aligned}\end{align} \]

when all advective and diffusive terms are treated explicitly, while

\[ \begin{align}\begin{aligned}\newcommand{\lap}[2]{ {#2} \gamma^k \Delta t \frac{\sqrt{Pr}}{\sqrt{Ra}} \frac{1}{J} \dif{}{\gcs{#1}} \left( \frac{J}{\sfact{#1}} \frac{1}{\sfact{#1}} \dif{}{\gcs{#1}} \right) } \Delta u_i & = \gamma^k \Delta t P_i^k + \alpha^k \Delta t A_i^{k } + \beta^k \Delta t A_i^{k-1} + \gamma^k \Delta t \left( D_{i1}^k + D_{i2}^k + D_{i3}^k \right),\\u_i^* & = u_i^k + \left\{ 1 - \lap{3}{c} \right\}^{-1} \left\{ 1 - \lap{2}{c} \right\}^{-1} \left\{ 1 - \lap{1}{c} \right\}^{-1} \Delta u_i,\end{aligned}\end{align} \]

when diffusive terms are treated implicitly.

Although we obtain a new velocity field, this does not satisfy the incompressibility in general, which necessitates the additional procedure below.

SMAC method¶

In addition to enforcing the incompressibility constraint, we also need to update the pressure field, for which we do not have an evolution equation such as:

\[\pder{p}{t} = \cdots.\]

To overcome these issues, we adopt the Simplified Marker And Cell (SMAC) method (Amsden and Harlow, J. Comput. Phys. (6), 1970), which is a two-step method.

Prediction Step¶

In the first step (prediction step), the momentum equation is integrated in time without taking care of mass conservation, as discussed above. The procedure is essentially identical to how we handle the temperature field. First, the explicit and implicit terms are calculated and stored in the corresponding buffers:

src/fluid/predict/ux.c¶

// Evaluate the right-hand-side terms of the x-momentum equation and hand each
//   of them to the source buffer it belongs to:
//   srcux.alpha for explicitly-treated terms, srcux.gamma for implicit ones.
// Returns 0 on success, 1 when init_laplacians reports a failure.
int compute_rhs_ux (
    const domain_t * domain,
    fluid_t * fluid
) {
  // the Laplacian tables are prepared lazily, on the first call only
  if (!laplacians.is_initialised && 0 != init_laplacians(domain)) {
    return 1;
  }
  // input fields
  const double * restrict vel_x = fluid->ux.data;
  const double * restrict vel_y = fluid->uy.data;
#if NDIMS == 3
  const double * restrict vel_z = fluid->uz.data;
#endif
  const double * restrict pres = fluid-> p.data;
  const double * restrict temp = fluid-> t.data;
  // destinations: explicit (alpha) and implicit (gamma) buffers
  double * restrict src_explicit = fluid->srcux.alpha.data;
  double * restrict src_implicit = fluid->srcux.gamma.data;
  const double nu = fluid_compute_momentum_diffusivity(fluid);
  // advection is always explicit
  advection_x(domain, vel_x,        src_explicit);
  advection_y(domain, vel_x, vel_y, src_explicit);
#if NDIMS == 3
  advection_z(domain, vel_x, vel_z, src_explicit);
#endif
  // the pressure gradient always goes to the implicit buffer
  pressure(domain, pres, src_implicit);
  // diffusion: the buffer is chosen per direction by the implicit flags
  diffusion_x(
      domain, nu, vel_x,
      param_m_implicit_x ? src_implicit : src_explicit
  );
  diffusion_y(
      domain, nu, vel_x,
      param_m_implicit_y ? src_implicit : src_explicit
  );
#if NDIMS == 3
  diffusion_z(
      domain, nu, vel_x,
      param_m_implicit_z ? src_implicit : src_explicit
  );
#endif
  // buoyancy is always explicit
  buoyancy(domain, temp, src_explicit);
  return 0;
}

src/fluid/predict/uy.c¶

// Evaluate the right-hand-side terms of the y-momentum equation and hand each
//   of them to the source buffer it belongs to:
//   srcuy.alpha for explicitly-treated terms, srcuy.gamma for implicit ones.
// Returns 0 on success, 1 when init_laplacians reports a failure.
int compute_rhs_uy(
    const domain_t * domain,
    fluid_t * fluid
) {
  // the Laplacian tables are prepared lazily, on the first call only
  if (!laplacians.is_initialised && 0 != init_laplacians(domain)) {
    return 1;
  }
  // input fields
  const double * restrict vel_x = fluid->ux.data;
  const double * restrict vel_y = fluid->uy.data;
#if NDIMS == 3
  const double * restrict vel_z = fluid->uz.data;
#endif
  const double * restrict pres = fluid-> p.data;
  // destinations: explicit (alpha) and implicit (gamma) buffers
  double * restrict src_explicit = fluid->srcuy.alpha.data;
  double * restrict src_implicit = fluid->srcuy.gamma.data;
  const double nu = fluid_compute_momentum_diffusivity(fluid);
  // advection is always explicit
  advection_x(domain, vel_y, vel_x, src_explicit);
  advection_y(domain, vel_y,        src_explicit);
#if NDIMS == 3
  advection_z(domain, vel_y, vel_z, src_explicit);
#endif
  // the pressure gradient always goes to the implicit buffer
  pressure(domain, pres, src_implicit);
  // diffusion: the buffer is chosen per direction by the implicit flags
  diffusion_x(
      domain, nu, vel_y,
      param_m_implicit_x ? src_implicit : src_explicit
  );
  diffusion_y(
      domain, nu, vel_y,
      param_m_implicit_y ? src_implicit : src_explicit
  );
#if NDIMS == 3
  diffusion_z(
      domain, nu, vel_y,
      param_m_implicit_z ? src_implicit : src_explicit
  );
#endif
  return 0;
}

src/fluid/predict/uz.c¶

// Evaluate the right-hand-side terms of the z-momentum equation and hand each
//   of them to the source buffer it belongs to:
//   srcuz.alpha for explicitly-treated terms, srcuz.gamma for implicit ones.
// Returns 0 on success, 1 when init_laplacians reports a failure.
int compute_rhs_uz (
    const domain_t * domain,
    fluid_t * fluid
) {
  // the Laplacian tables are prepared lazily, on the first call only
  if (!laplacians.is_initialised && 0 != init_laplacians(domain)) {
    return 1;
  }
  // input fields
  const double * restrict vel_x = fluid->ux.data;
  const double * restrict vel_y = fluid->uy.data;
  const double * restrict vel_z = fluid->uz.data;
  const double * restrict pres = fluid-> p.data;
  // destinations: explicit (alpha) and implicit (gamma) buffers
  double * restrict src_explicit = fluid->srcuz.alpha.data;
  double * restrict src_implicit = fluid->srcuz.gamma.data;
  const double nu = fluid_compute_momentum_diffusivity(fluid);
  // advection is always explicit
  advection_x(domain, vel_z, vel_x, src_explicit);
  advection_y(domain, vel_z, vel_y, src_explicit);
  advection_z(domain, vel_z,        src_explicit);
  // the pressure gradient always goes to the implicit buffer
  pressure(domain, pres, src_implicit);
  // diffusion: the buffer is chosen per direction by the implicit flags
  diffusion_x(
      domain, nu, vel_z,
      param_m_implicit_x ? src_implicit : src_explicit
  );
  diffusion_y(
      domain, nu, vel_z,
      param_m_implicit_y ? src_implicit : src_explicit
  );
  diffusion_z(
      domain, nu, vel_z,
      param_m_implicit_z ? src_implicit : src_explicit
  );
  return 0;
}

The stored values are used to compute \(\Delta u_i\):

src/fluid/predict/ux.c¶

    // weights of the current Runge-Kutta sub-step
    const double coef_a = rkcoefs[rkstep].alpha;
    const double coef_b = rkcoefs[rkstep].beta ;
    const double coef_g = rkcoefs[rkstep].gamma;
    // stored right-hand-side buffers of ux, one per weight
    const double * restrict srcuxa = fluid->srcux.alpha.data;
    const double * restrict srcuxb = fluid->srcux.beta .data;
    const double * restrict srcuxg = fluid->srcux.gamma.data;
    const int isize = domain->mysizes[0];
    const int jsize = domain->mysizes[1];
#if NDIMS == 3
    const int ksize = domain->mysizes[2];
#endif
    // the increment is written to the x1 buffer of the linear-system solver
    double * restrict dux = linear_system.x1pncl;
    // number of ux points to be updated (isize - 1 in x);
    //   each factor is widened to size_t before multiplying,
    //   since a product of int sizes may overflow int on large local domains
#if NDIMS == 2
    const size_t nitems = (size_t)(isize - 1) * (size_t)jsize;
#else
    const size_t nitems = (size_t)(isize - 1) * (size_t)jsize * (size_t)ksize;
#endif
    // weighted sum of the three buffers, scaled by the time-step size
    for (size_t n = 0; n < nitems; n++) {
      dux[n] =
        + coef_a * dt * srcuxa[n]
        + coef_b * dt * srcuxb[n]
        + coef_g * dt * srcuxg[n];
    }

src/fluid/predict/uy.c¶

    // weights of the current Runge-Kutta sub-step
    const double coef_a = rkcoefs[rkstep].alpha;
    const double coef_b = rkcoefs[rkstep].beta ;
    const double coef_g = rkcoefs[rkstep].gamma;
    // stored right-hand-side buffers of uy, one per weight
    const double * restrict srcuya = fluid->srcuy.alpha.data;
    const double * restrict srcuyb = fluid->srcuy.beta .data;
    const double * restrict srcuyg = fluid->srcuy.gamma.data;
    const int isize = domain->mysizes[0];
    const int jsize = domain->mysizes[1];
#if NDIMS == 3
    const int ksize = domain->mysizes[2];
#endif
    // the increment is written to the x1 buffer of the linear-system solver
    double * restrict duy = linear_system.x1pncl;
    // number of uy points to be updated;
    //   each factor is widened to size_t before multiplying,
    //   since a product of int sizes may overflow int on large local domains
#if NDIMS == 2
    const size_t nitems = (size_t)isize * (size_t)jsize;
#else
    const size_t nitems = (size_t)isize * (size_t)jsize * (size_t)ksize;
#endif
    // weighted sum of the three buffers, scaled by the time-step size
    for (size_t n = 0; n < nitems; n++) {
      duy[n] =
        + coef_a * dt * srcuya[n]
        + coef_b * dt * srcuyb[n]
        + coef_g * dt * srcuyg[n];
    }

src/fluid/predict/uz.c¶

// weights of the current Runge-Kutta sub-step
const double coef_a = rkcoefs[rkstep].alpha;
const double coef_b = rkcoefs[rkstep].beta ;
const double coef_g = rkcoefs[rkstep].gamma;
// stored right-hand-side buffers of uz, one per weight
const double * restrict srcuza = fluid->srcuz.alpha.data;
const double * restrict srcuzb = fluid->srcuz.beta .data;
const double * restrict srcuzg = fluid->srcuz.gamma.data;
const int isize = domain->mysizes[0];
const int jsize = domain->mysizes[1];
const int ksize = domain->mysizes[2];
// the increment is written to the x1 buffer of the linear-system solver
double * restrict duz = linear_system.x1pncl;
// number of uz points to be updated;
//   each factor is widened to size_t before multiplying,
//   since a product of int sizes may overflow int on large local domains
const size_t nitems = (size_t)isize * (size_t)jsize * (size_t)ksize;
// weighted sum of the three buffers, scaled by the time-step size
for (size_t n = 0; n < nitems; n++) {
  duz[n] =
    + coef_a * dt * srcuza[n]
    + coef_b * dt * srcuzb[n]
    + coef_g * dt * srcuzg[n];
}

When necessary, linear systems are solved to take care of the implicit treatments:

src/fluid/predict/ux.c¶

if (param_m_implicit_x) {
  // implicit treatment in x: the system is solved directly on the x1 buffer,
  //   no transpose is involved
  tdm_info_t * const solver = linear_system.tdm_x;
  // ask the solver for its size and the three diagonals
  int nrows = 0;
  double * restrict lower = NULL;
  double * restrict diag  = NULL;
  double * restrict upper = NULL;
  tdm.get_size(solver, &nrows);
  tdm.get_l(solver, &lower);
  tdm.get_c(solver, &diag);
  tdm.get_u(solver, &upper);
  // row-dependent coefficients: identity minus prefactor times the x Laplacian
  for (int row = 0; row < nrows; row++) {
    const laplacian_t * const lap = &laplacians.lapx[row];
    lower[row] =    - prefactor * lap->l;
    diag [row] = 1. - prefactor * lap->c;
    upper[row] =    - prefactor * lap->u;
  }
  tdm.solve(solver, linear_system.x1pncl);
}

src/fluid/predict/ux.c¶

if (param_m_implicit_y) {
  // move the data from the x1 buffer to the y1 buffer before solving in y
  sdecomp.transpose.execute(
      linear_system.transposer_x1_to_y1,
      linear_system.x1pncl,
      linear_system.y1pncl
  );
  tdm_info_t * const solver = linear_system.tdm_y;
  // ask the solver for its size and the three diagonals
  int nrows = 0;
  double * restrict lower = NULL;
  double * restrict diag  = NULL;
  double * restrict upper = NULL;
  tdm.get_size(solver, &nrows);
  tdm.get_l(solver, &lower);
  tdm.get_c(solver, &diag);
  tdm.get_u(solver, &upper);
  // laplacians.lapy is one stencil (not indexed by row),
  //   so every row receives the same three entries
  const double val_l =    - prefactor * laplacians.lapy.l;
  const double val_c = 1. - prefactor * laplacians.lapy.c;
  const double val_u =    - prefactor * laplacians.lapy.u;
  for (int row = 0; row < nrows; row++) {
    lower[row] = val_l;
    diag [row] = val_c;
    upper[row] = val_u;
  }
  tdm.solve(solver, linear_system.y1pncl);
  // bring the solution back to the x1 buffer
  sdecomp.transpose.execute(
      linear_system.transposer_y1_to_x1,
      linear_system.y1pncl,
      linear_system.x1pncl
  );
}

src/fluid/predict/ux.c¶

if (param_m_implicit_z) {
  // move the data from the x1 buffer to the z2 buffer before solving in z
  sdecomp.transpose.execute(
      linear_system.transposer_x1_to_z2,
      linear_system.x1pncl,
      linear_system.z2pncl
  );
  tdm_info_t * const solver = linear_system.tdm_z;
  // ask the solver for its size and the three diagonals
  int nrows = 0;
  double * restrict lower = NULL;
  double * restrict diag  = NULL;
  double * restrict upper = NULL;
  tdm.get_size(solver, &nrows);
  tdm.get_l(solver, &lower);
  tdm.get_c(solver, &diag);
  tdm.get_u(solver, &upper);
  // laplacians.lapz is one stencil (not indexed by row),
  //   so every row receives the same three entries
  const double val_l =    - prefactor * laplacians.lapz.l;
  const double val_c = 1. - prefactor * laplacians.lapz.c;
  const double val_u =    - prefactor * laplacians.lapz.u;
  for (int row = 0; row < nrows; row++) {
    lower[row] = val_l;
    diag [row] = val_c;
    upper[row] = val_u;
  }
  tdm.solve(solver, linear_system.z2pncl);
  // bring the solution back to the x1 buffer
  sdecomp.transpose.execute(
      linear_system.transposer_z2_to_x1,
      linear_system.z2pncl,
      linear_system.x1pncl
  );
}

src/fluid/predict/uy.c¶

if (param_m_implicit_x) {
  // implicit treatment in x: the system is solved directly on the x1 buffer,
  //   no transpose is involved
  tdm_info_t * const solver = linear_system.tdm_x;
  // ask the solver for its size and the three diagonals
  int nrows = 0;
  double * restrict lower = NULL;
  double * restrict diag  = NULL;
  double * restrict upper = NULL;
  tdm.get_size(solver, &nrows);
  tdm.get_l(solver, &lower);
  tdm.get_c(solver, &diag);
  tdm.get_u(solver, &upper);
  // row-dependent coefficients: identity minus prefactor times the x Laplacian
  for (int row = 0; row < nrows; row++) {
    const laplacian_t * const lap = &laplacians.lapx[row];
    lower[row] =    - prefactor * lap->l;
    diag [row] = 1. - prefactor * lap->c;
    upper[row] =    - prefactor * lap->u;
  }
  tdm.solve(solver, linear_system.x1pncl);
}

src/fluid/predict/uy.c¶

if (param_m_implicit_y) {
  // move the data from the x1 buffer to the y1 buffer before solving in y
  sdecomp.transpose.execute(
      linear_system.transposer_x1_to_y1,
      linear_system.x1pncl,
      linear_system.y1pncl
  );
  tdm_info_t * const solver = linear_system.tdm_y;
  // ask the solver for its size and the three diagonals
  int nrows = 0;
  double * restrict lower = NULL;
  double * restrict diag  = NULL;
  double * restrict upper = NULL;
  tdm.get_size(solver, &nrows);
  tdm.get_l(solver, &lower);
  tdm.get_c(solver, &diag);
  tdm.get_u(solver, &upper);
  // laplacians.lapy is one stencil (not indexed by row),
  //   so every row receives the same three entries
  const double val_l =    - prefactor * laplacians.lapy.l;
  const double val_c = 1. - prefactor * laplacians.lapy.c;
  const double val_u =    - prefactor * laplacians.lapy.u;
  for (int row = 0; row < nrows; row++) {
    lower[row] = val_l;
    diag [row] = val_c;
    upper[row] = val_u;
  }
  tdm.solve(solver, linear_system.y1pncl);
  // bring the solution back to the x1 buffer
  sdecomp.transpose.execute(
      linear_system.transposer_y1_to_x1,
      linear_system.y1pncl,
      linear_system.x1pncl
  );
}

src/fluid/predict/uy.c¶

if (param_m_implicit_z) {
  // move the data from the x1 buffer to the z2 buffer before solving in z
  sdecomp.transpose.execute(
      linear_system.transposer_x1_to_z2,
      linear_system.x1pncl,
      linear_system.z2pncl
  );
  tdm_info_t * const solver = linear_system.tdm_z;
  // ask the solver for its size and the three diagonals
  int nrows = 0;
  double * restrict lower = NULL;
  double * restrict diag  = NULL;
  double * restrict upper = NULL;
  tdm.get_size(solver, &nrows);
  tdm.get_l(solver, &lower);
  tdm.get_c(solver, &diag);
  tdm.get_u(solver, &upper);
  // laplacians.lapz is one stencil (not indexed by row),
  //   so every row receives the same three entries
  const double val_l =    - prefactor * laplacians.lapz.l;
  const double val_c = 1. - prefactor * laplacians.lapz.c;
  const double val_u =    - prefactor * laplacians.lapz.u;
  for (int row = 0; row < nrows; row++) {
    lower[row] = val_l;
    diag [row] = val_c;
    upper[row] = val_u;
  }
  tdm.solve(solver, linear_system.z2pncl);
  // bring the solution back to the x1 buffer
  sdecomp.transpose.execute(
      linear_system.transposer_z2_to_x1,
      linear_system.z2pncl,
      linear_system.x1pncl
  );
}

src/fluid/predict/uz.c¶

if (param_m_implicit_x) {
  // implicit treatment in x: the system is solved directly on the x1 buffer,
  //   no transpose is involved
  tdm_info_t * const solver = linear_system.tdm_x;
  // ask the solver for its size and the three diagonals
  int nrows = 0;
  double * restrict lower = NULL;
  double * restrict diag  = NULL;
  double * restrict upper = NULL;
  tdm.get_size(solver, &nrows);
  tdm.get_l(solver, &lower);
  tdm.get_c(solver, &diag);
  tdm.get_u(solver, &upper);
  // row-dependent coefficients: identity minus prefactor times the x Laplacian
  for (int row = 0; row < nrows; row++) {
    const laplacian_t * const lap = &laplacians.lapx[row];
    lower[row] =    - prefactor * lap->l;
    diag [row] = 1. - prefactor * lap->c;
    upper[row] =    - prefactor * lap->u;
  }
  tdm.solve(solver, linear_system.x1pncl);
}

src/fluid/predict/uz.c¶

if (param_m_implicit_y) {
  // move the data from the x1 buffer to the y1 buffer before solving in y
  sdecomp.transpose.execute(
      linear_system.transposer_x1_to_y1,
      linear_system.x1pncl,
      linear_system.y1pncl
  );
  tdm_info_t * const solver = linear_system.tdm_y;
  // ask the solver for its size and the three diagonals
  int nrows = 0;
  double * restrict lower = NULL;
  double * restrict diag  = NULL;
  double * restrict upper = NULL;
  tdm.get_size(solver, &nrows);
  tdm.get_l(solver, &lower);
  tdm.get_c(solver, &diag);
  tdm.get_u(solver, &upper);
  // laplacians.lapy is one stencil (not indexed by row),
  //   so every row receives the same three entries
  const double val_l =    - prefactor * laplacians.lapy.l;
  const double val_c = 1. - prefactor * laplacians.lapy.c;
  const double val_u =    - prefactor * laplacians.lapy.u;
  for (int row = 0; row < nrows; row++) {
    lower[row] = val_l;
    diag [row] = val_c;
    upper[row] = val_u;
  }
  tdm.solve(solver, linear_system.y1pncl);
  // bring the solution back to the x1 buffer
  sdecomp.transpose.execute(
      linear_system.transposer_y1_to_x1,
      linear_system.y1pncl,
      linear_system.x1pncl
  );
}

src/fluid/predict/uz.c¶

if (param_m_implicit_z) {
  // move the data from the x1 buffer to the z2 buffer before solving in z
  sdecomp.transpose.execute(
      linear_system.transposer_x1_to_z2,
      linear_system.x1pncl,
      linear_system.z2pncl
  );
  tdm_info_t * const solver = linear_system.tdm_z;
  // ask the solver for its size and the three diagonals
  int nrows = 0;
  double * restrict lower = NULL;
  double * restrict diag  = NULL;
  double * restrict upper = NULL;
  tdm.get_size(solver, &nrows);
  tdm.get_l(solver, &lower);
  tdm.get_c(solver, &diag);
  tdm.get_u(solver, &upper);
  // laplacians.lapz is one stencil (not indexed by row),
  //   so every row receives the same three entries
  const double val_l =    - prefactor * laplacians.lapz.l;
  const double val_c = 1. - prefactor * laplacians.lapz.c;
  const double val_u =    - prefactor * laplacians.lapz.u;
  for (int row = 0; row < nrows; row++) {
    lower[row] = val_l;
    diag [row] = val_c;
    upper[row] = val_u;
  }
  tdm.solve(solver, linear_system.z2pncl);
  // bring the solution back to the x1 buffer
  sdecomp.transpose.execute(
      linear_system.transposer_z2_to_x1,
      linear_system.z2pncl,
      linear_system.x1pncl
  );
}

Finally the velocity field is updated:

src/fluid/predict/ux.c¶

    // Add the increment stored in the x1 buffer to ux, then refresh its boundaries.
    // NOTE(review): BEGIN / END and UX are macros defined outside this excerpt;
    //   presumably they loop over the ux points using isize / jsize / ksize
    //   and provide i, j, k and the running index cnt - confirm
    const int isize = domain->mysizes[0];
    const int jsize = domain->mysizes[1];
#if NDIMS == 3
    const int ksize = domain->mysizes[2];
#endif
    // increment of ux, read from the solver buffer
    const double * restrict dux = linear_system.x1pncl;
    double * restrict ux = fluid->ux.data;
    BEGIN
#if NDIMS == 2
      UX(i, j) += dux[cnt];
#else
      UX(i, j, k) += dux[cnt];
#endif
    END
    // propagate a failure of the boundary update to the caller
    if (0 != fluid_update_boundaries_ux(domain, &fluid->ux)) {
      return 1;
    }

src/fluid/predict/uy.c¶

    // Add the increment stored in the x1 buffer to uy, then refresh its boundaries.
    // NOTE(review): BEGIN / END and UY are macros defined outside this excerpt;
    //   presumably they loop over the uy points using isize / jsize / ksize
    //   and provide i, j, k and the running index cnt - confirm
    const int isize = domain->mysizes[0];
    const int jsize = domain->mysizes[1];
#if NDIMS == 3
    const int ksize = domain->mysizes[2];
#endif
    // increment of uy, read from the solver buffer
    const double * restrict duy = linear_system.x1pncl;
    double * restrict uy = fluid->uy.data;
    BEGIN
#if NDIMS == 2
      UY(i, j) += duy[cnt];
#else
      UY(i, j, k) += duy[cnt];
#endif
    END
    // propagate a failure of the boundary update to the caller
    if (0 != fluid_update_boundaries_uy(domain, &fluid->uy)) {
      return 1;
    }

src/fluid/predict/uz.c¶

// Add the increment stored in the x1 buffer to uz, then refresh its boundaries.
// NOTE(review): BEGIN / END and UZ are macros defined outside this excerpt;
//   presumably they loop over the uz points using isize / jsize / ksize
//   and provide i, j, k and the running index cnt - confirm
const int isize = domain->mysizes[0];
const int jsize = domain->mysizes[1];
const int ksize = domain->mysizes[2];
// increment of uz, read from the solver buffer
const double * restrict duz = linear_system.x1pncl;
double * restrict uz = fluid->uz.data;
BEGIN
  UZ(i, j, k) += duz[cnt];
END
// propagate a failure of the boundary update to the caller
if (0 != fluid_update_boundaries_uz(domain, &fluid->uz)) {
  return 1;
}

Correction Step¶

The updated velocity field \(u_i^*\), which in general violates the incompressibility, is corrected in the second step (correction step). The idea is mathematically written as

\[u_i^{k+1} = u_i^* - \gamma^k \Delta t \frac{1}{\sfact{i}} \dif{\psi}{\gcs{i}},\]

where \(\psi\) is a scalar potential to be given. By taking the (discrete) divergence, we obtain

\[\frac{1}{J} \dif{}{\gcs{i}} \left( \frac{J}{\sfact{i}} \vel{i}^{k+1} \right) = \frac{1}{J} \dif{}{\gcs{i}} \left( \frac{J}{\sfact{i}} \vel{i}^* \right) - \gamma^k \Delta t \frac{1}{J} \dif{}{\gcs{i}} \left( \frac{J}{\sfact{i}} \frac{1}{\sfact{i}} \dif{\psi}{\gcs{i}} \right).\]

By requiring the new velocity field to satisfy the (discrete) incompressibility constraint (namely, the left-hand side to be zero), we obtain

\[\frac{1}{J} \dif{}{\gcs{i}} \left( \frac{J}{\sfact{i}} \frac{1}{\sfact{i}} \dif{\psi}{\gcs{i}} \right) = \frac{1}{\gamma^k \Delta t} \frac{1}{J} \dif{}{\gcs{i}} \left( \frac{J}{\sfact{i}} \vel{i}^* \right),\]

which is a Poisson equation with respect to \(\psi\).

The right-hand-side term is computed as follows in the code:

src/fluid/compute_potential.c¶

// Fill rhs with the right-hand side of the Poisson equation:
//   the discrete divergence of the velocity field,
//   scaled by 1 / (gamma * dt) and by the FFT normalisation factor.
// Always returns 0.
// NOTE(review): BEGIN / END and the accessors HXXF, JDXF, JDXC, UX, UY, UZ
//   are macros defined outside this excerpt; presumably they iterate over the
//   cell centres and provide i, j, k and the running index cnt - confirm
static int assign_input (
    const domain_t * domain,
    const size_t rkstep,
    const double dt,
    const fluid_t * fluid,
    double * restrict rhs
) {
  const int isize = domain->mysizes[0];
  const int jsize = domain->mysizes[1];
#if NDIMS == 3
  const int ksize = domain->mysizes[2];
#endif
  // x scale factors are an array (they vary with i), y and z are scalars
  const double * restrict hxxf = domain->hxxf;
  const double hy = domain->hy;
#if NDIMS == 3
  const double hz = domain->hz;
#endif
  // Jacobian determinants, accessed at i and i+1 (jdxf) and at i (jdxc)
  const double * restrict jdxf = domain->jdxf;
  const double * restrict jdxc = domain->jdxc;
  const double * restrict ux = fluid->ux.data;
  const double * restrict uy = fluid->uy.data;
#if NDIMS == 3
  const double * restrict uz = fluid->uz.data;
#endif
  // normalise FFT beforehand
#if NDIMS == 2
  const double norm = 1. * domain->glsizes[1];
#else
  const double norm = 1. * domain->glsizes[1] * domain->glsizes[2];
#endif
  // 1 / (gamma dt) from the Poisson equation, combined with the normalisation
  const double prefactor = 1. / (rkcoefs[rkstep].gamma * dt) / norm;
  BEGIN
    // metric quantities on both sides of (xm, xp) and at (x0) the point i
    const double hx_xm = HXXF(i  );
    const double hx_xp = HXXF(i+1);
    const double jd_xm = JDXF(i  );
    const double jd_x0 = JDXC(i  );
    const double jd_xp = JDXF(i+1);
    // velocities on the negative (m) and positive (p) sides in each direction
#if NDIMS == 2
    const double ux_xm = UX(i  , j  );
    const double ux_xp = UX(i+1, j  );
    const double uy_ym = UY(i  , j  );
    const double uy_yp = UY(i  , j+1);
#else
    const double ux_xm = UX(i  , j  , k  );
    const double ux_xp = UX(i+1, j  , k  );
    const double uy_ym = UY(i  , j  , k  );
    const double uy_yp = UY(i  , j+1, k  );
    const double uz_zm = UZ(i  , j  , k  );
    const double uz_zp = UZ(i  , j  , k+1);
#endif
    // 1 / J * sum over directions of the difference of (J / h * u)
    const double div = 1. / jd_x0 * (
        - jd_xm / hx_xm * ux_xm + jd_xp / hx_xp * ux_xp
        - jd_x0 / hy    * uy_ym + jd_x0 / hy    * uy_yp
#if NDIMS == 3
        - jd_x0 / hz    * uz_zm + jd_x0 / hz    * uz_zp
#endif
    );
    rhs[cnt] = prefactor * div;
  END
  return 0;
}

After solving the Poisson equation, the velocity field is corrected as follows in the code:

src/fluid/correct/ux.c¶

// Subtract the x-gradient of the scalar potential psi from ux:
//   ux(i) -= prefactor / hx(i) * (psi(i) - psi(i-1)),
//   and update the boundary and halo cells of ux afterwards.
// Returns 0 on success, 1 when the boundary update fails.
int fluid_correct_velocity_ux (
    const domain_t * domain,
    const double prefactor,
    fluid_t * fluid
) {
  // NOTE: the names below are kept as they are,
  //   since the loop / accessor macros presumably refer to them
  const int isize = domain->mysizes[0];
  const int jsize = domain->mysizes[1];
#if NDIMS == 3
  const int ksize = domain->mysizes[2];
#endif
  const double * restrict hxxf = domain->hxxf;
  const double * restrict psi = fluid->psi.data;
  double * restrict ux = fluid->ux.data;
  BEGIN
    const double hx = HXXF(i  );
#if NDIMS == 2
    // difference of the potential across the ux point
    const double dpsi = - PSI(i-1, j  ) + PSI(i  , j  );
    UX(i, j) -= prefactor / hx * dpsi;
#else
    // difference of the potential across the ux point
    const double dpsi = - PSI(i-1, j  , k  ) + PSI(i  , j  , k  );
    UX(i, j, k) -= prefactor / hx * dpsi;
#endif
  END
  // update boundary and halo cells, reporting a failure as 1
  return (0 != fluid_update_boundaries_ux(domain, &fluid->ux)) ? 1 : 0;
}

src/fluid/correct/uy.c¶

// Subtract the y-gradient of the scalar potential psi from uy:
//   uy(j) -= prefactor / hy * (psi(j) - psi(j-1)),
//   and update the boundary and halo cells of uy afterwards.
// Returns 0 on success, 1 when the boundary update fails.
int fluid_correct_velocity_uy (
    const domain_t * domain,
    const double prefactor,
    fluid_t * fluid
) {
  // NOTE: the names below are kept as they are,
  //   since the loop / accessor macros presumably refer to them
  const int isize = domain->mysizes[0];
  const int jsize = domain->mysizes[1];
#if NDIMS == 3
  const int ksize = domain->mysizes[2];
#endif
  const double hy = domain->hy;
  const double * restrict psi = fluid->psi.data;
  double * restrict uy = fluid->uy.data;
  BEGIN
#if NDIMS == 2
    // difference of the potential across the uy point
    const double dpsi = - PSI(i  , j-1) + PSI(i  , j  );
    UY(i, j) -= prefactor / hy * dpsi;
#else
    // difference of the potential across the uy point
    const double dpsi = - PSI(i  , j-1, k  ) + PSI(i  , j  , k  );
    UY(i, j, k) -= prefactor / hy * dpsi;
#endif
  END
  // update boundary and halo cells, reporting a failure as 1
  return (0 != fluid_update_boundaries_uy(domain, &fluid->uy)) ? 1 : 0;
}

src/fluid/correct/uz.c¶

// Subtract the z-gradient of the scalar potential psi from uz:
//   uz(k) -= prefactor / hz * (psi(k) - psi(k-1)),
//   and update the boundary and halo cells of uz afterwards.
// Returns 0 on success, 1 when the boundary update fails.
int fluid_correct_velocity_uz (
    const domain_t * domain,
    const double prefactor,
    fluid_t * fluid
) {
  // NOTE: the names below are kept as they are,
  //   since the accessor macros presumably refer to them
  const int isize = domain->mysizes[0];
  const int jsize = domain->mysizes[1];
  const int ksize = domain->mysizes[2];
  const double hz = domain->hz;
  const double * restrict psi = fluid->psi.data;
  double * restrict uz = fluid->uz.data;
  // the grid is uniform in z: the scaling is the same at every point
  const double scale = prefactor / hz;
  for (int k = 1; k <= ksize; k++) {
    for (int j = 1; j <= jsize; j++) {
      for (int i = 1; i <= isize; i++) {
        // difference of the potential across the uz point
        const double dpsi = - PSI(i  , j  , k-1) + PSI(i  , j  , k  );
        UZ(i, j, k) -= scale * dpsi;
      }
    }
  }
  // update boundary and halo cells, reporting a failure as 1
  return (0 != fluid_update_boundaries_uz(domain, &fluid->uz)) ? 1 : 0;
}

Pressure and Scalar Potential¶

Finally we relate the pressure field with the scalar potential to close the system. Each Runge-Kutta step when all diffusive terms are treated explicitly is given by

\[ \begin{align}\begin{aligned}\Delta u_i & = \gamma^k \Delta t P_i^k + \alpha^k \Delta t \left( A_i^{k } + D_{i1}^{k } + D_{i2}^{k } + D_{i3}^{k } \right) + \beta^k \Delta t \left( A_i^{k-1} + D_{i1}^{k-1} + D_{i2}^{k-1} + D_{i3}^{k-1} \right),\\u_i^* & = u_i^k + \Delta u_i,\\u_i^{k+1} & = u_i^* - \gamma^k \Delta t \frac{1}{\sfact{i}} \dif{\psi}{\gcs{i}}.\end{aligned}\end{align} \]

Summing all three steps yields

\[u_i^{k+1} = u_i^k - \gamma^k \Delta t \frac{1}{\sfact{i}} \dif{\psi}{\gcs{i}} + \gamma^k \Delta t P_i^k + \alpha^k \Delta t \left( A_i^{k } + D_{i1}^{k } + D_{i2}^{k } + D_{i3}^{k } \right) + \beta^k \Delta t \left( A_i^{k-1} + D_{i1}^{k-1} + D_{i2}^{k-1} + D_{i3}^{k-1} \right).\]

Since the pressure field should be treated implicitly in time, we find a requirement:

\[- \gamma^k \Delta t \frac{1}{\sfact{i}} \dif{\psi}{\gcs{i}} + \gamma^k \Delta t P_i^k = \gamma^k \Delta t P_i^{k+1},\]

or equivalently

\[p^{k+1} = p^k + \psi.\]

Next, we consider cases where the diffusive terms are partially treated implicitly in time; for instance, the following relation holds when the diffusive terms are treated implicitly only in \(x\) direction:

\[ \begin{align}\begin{aligned}\Delta u_i & = \gamma^k \Delta t P_i^k + \alpha^k \Delta t \left( A_i^{k } + D_{i2}^{k } + D_{i3}^{k } \right) + \beta^k \Delta t \left( A_i^{k-1} + D_{i2}^{k-1} + D_{i3}^{k-1} \right) + \gamma^k \Delta t D_{i1}^{k },\\u_i^* & = u_i^k + \left\{ 1 - \lap{1}{c} \right\}^{-1} \Delta u_i,\\u_i^{k+1} & = u_i^* - \gamma^k \Delta t \frac{1}{\sfact{i}} \dif{\psi}{\gcs{i}}.\end{aligned}\end{align} \]

Note that the left-hand side of the second step is \(u_i^*\), whereas ideally it would be \(u_i^{k+1}\), which is still unknown at this point. By requiring the pressure-gradient term to be implicit in time, and after some algebra, we obtain

\[\gamma^k \Delta t \left\{ 1 - \lap{1}{c} \right\} \frac{1}{\sfact{i}} \dif{\psi}{\gcs{i}} - \gamma^k \Delta t P_i^k = - \gamma^k \Delta t P_i^{k+1},\]

or equivalently

\[\frac{1}{\sfact{i}} \dif{p^{k+1}}{\gcs{i}} = \frac{1}{\sfact{i}} \dif{p^k}{\gcs{i}} + \left\{ 1 - \lap{1}{c} \right\} \frac{1}{\sfact{i}} \dif{\psi}{\gcs{i}}.\]

Since the spatial-differential operators are interchangeable, we simplify the relation to

\[p^{k+1} = p^k + \psi - \lap{1}{c} \psi.\]

Similarly, when all diffusive terms are treated implicitly, we have

\[ \begin{align}\begin{aligned}\Delta u_i & = \gamma^k \Delta t P_i^k + \alpha^k \Delta t A_i^{k } + \beta^k \Delta t A_i^{k-1} + \gamma^k \Delta t \left( D_{i1}^{k } + D_{i2}^{k } + D_{i3}^{k } \right),\\u_i^* & = u_i^k + \left\{ 1 - \lap{3}{c} \right\}^{-1} \left\{ 1 - \lap{2}{c} \right\}^{-1} \left\{ 1 - \lap{1}{c} \right\}^{-1} \Delta u_i,\\u_i^{k+1} & = u_i^* - \gamma^k \Delta t \frac{1}{\sfact{i}} \dif{\psi}{\gcs{i}},\\p^{k+1} & = p^k + \psi - \lap{1}{c} \psi - \lap{2}{c} \psi - \lap{3}{c} \psi.\end{aligned}\end{align} \]

Updating pressure field using the scalar potential is implemented as follows:

src/fluid/update_pressure.c¶

// Update the pressure field using the scalar potential psi:
//   the explicit contribution is always added,
//   while a correction is applied for each direction
//   in which the diffusive terms are treated implicitly.
// Finally the boundary and halo cells of the pressure are updated.
// Returns 0 on success, 1 if any of the steps reports a failure.
int fluid_update_pressure (
    const domain_t * domain,
    const size_t rkstep,
    const double dt,
    fluid_t * fluid
) {
  // explicit contribution, always present
  if (0 != explicit_contribution(domain, fluid)) {
    return 1;
  }
  // gamma * dt * (momentum diffusivity), times 0.5
  // NOTE(review): 0.5 is presumably the constant prefactor of the implicit
  //   diffusive operator used in the prediction step - confirm
  const double prefactor =
    0.5 * rkcoefs[rkstep].gamma * dt * fluid_compute_momentum_diffusivity(fluid);
  // additional terms if the diffusive terms in the direction are treated implicitly
  if (param_m_implicit_x) {
    if (0 != implicit_x_contribution(domain, prefactor, fluid)) {
      return 1;
    }
  }
  if (param_m_implicit_y) {
    if (0 != implicit_y_contribution(domain, prefactor, fluid)) {
      return 1;
    }
  }
#if NDIMS == 3
  if (param_m_implicit_z) {
    if (0 != implicit_z_contribution(domain, prefactor, fluid)) {
      return 1;
    }
  }
#endif
  // impose boundary conditions and communicate halo cells
  if (0 != fluid_update_boundaries_p(domain, &fluid->p)) {
    return 1;
  }
  return 0;
}

The explicit contribution, which is always present, is given here:

src/fluid/update_pressure.c¶

static int explicit_contribution (
    const domain_t * domain,
    const fluid_t * fluid
) {
  const int isize = domain->mysizes[0];
  const int jsize = domain->mysizes[1];
#if NDIMS == 3
  const int ksize = domain->mysizes[2];
#endif
  const double * restrict psi = fluid->psi.data;
  double * restrict p = fluid->p.data;
  BEGIN
#if NDIMS == 2
    P(i, j) += PSI(i, j);
#else
    P(i, j, k) += PSI(i, j, k);
#endif
  END
  return 0;
}

The implicit contributions, which are needed when the Laplace operator in the corresponding direction is treated implicitly, are given here:

src/fluid/update_pressure.c¶

// Subtract prefactor times the discrete x-Laplacian of psi from the pressure p.
// The three-point stencil (l, c, u) is built at each point
//   from the x scale factors and the Jacobian determinants.
// Always returns 0.
// NOTE(review): BEGIN / END and the accessors HXXF, JDXF, JDXC, PSI, P
//   are macros defined outside this excerpt; presumably they iterate over the
//   pressure points and provide i, j, k - confirm
static int implicit_x_contribution (
    const domain_t * domain,
    const double prefactor,
    fluid_t * fluid
) {
  const int isize = domain->mysizes[0];
  const int jsize = domain->mysizes[1];
#if NDIMS == 3
  const int ksize = domain->mysizes[2];
#endif
  const double * restrict hxxf = domain->hxxf;
  const double * restrict jdxf = domain->jdxf;
  const double * restrict jdxc = domain->jdxc;
  const double * restrict psi = fluid->psi.data;
  double * restrict p = fluid->p.data;
  BEGIN
    // metric quantities on both sides of (xm, xp) and at (x0) the point i
    const double hx_xm = HXXF(i  );
    const double hx_xp = HXXF(i+1);
    const double jd_xm = JDXF(i  );
    const double jd_x0 = JDXC(i  );
    const double jd_xp = JDXF(i+1);
    // lower / upper weights: 1 / J * (J / h / h) on each side,
    //   the centre weight makes the three weights sum to zero
    const double l = 1. / jd_x0 * jd_xm / hx_xm / hx_xm;
    const double u = 1. / jd_x0 * jd_xp / hx_xp / hx_xp;
    const double c = - l - u;
#if NDIMS == 2
    const double psi_xm = PSI(i-1, j  );
    const double psi_x0 = PSI(i  , j  );
    const double psi_xp = PSI(i+1, j  );
    double * pre = &P(i, j);
#else
    const double psi_xm = PSI(i-1, j  , k  );
    const double psi_x0 = PSI(i  , j  , k  );
    const double psi_xp = PSI(i+1, j  , k  );
    double * pre = &P(i, j, k);
#endif
    // p -= prefactor * (Laplacian of psi in x)
    *pre -= prefactor * (
        + l * psi_xm
        + c * psi_x0
        + u * psi_xp
    );
  END
  return 0;
}

src/fluid/update_pressure.c¶

// Subtract prefactor times the discrete y-Laplacian of psi from the pressure p.
// Always returns 0.
static int implicit_y_contribution (
    const domain_t * domain,
    const double prefactor,
    fluid_t * fluid
) {
  // NOTE: the names below are kept as they are,
  //   since the loop / accessor macros presumably refer to them
  const int isize = domain->mysizes[0];
  const int jsize = domain->mysizes[1];
#if NDIMS == 3
  const int ksize = domain->mysizes[2];
#endif
  const double hy = domain->hy;
  const double * restrict psi = fluid->psi.data;
  double * restrict p = fluid->p.data;
  // stencil weights are identical at every point (hy is a scalar):
  //   the two neighbours share one weight, the centre is minus their sum
  const double w_side = 1. / hy / hy;
  const double w_diag = - w_side - w_side;
  BEGIN
#if NDIMS == 2
    const double lap_psi =
      + w_side * PSI(i  , j-1)
      + w_diag * PSI(i  , j  )
      + w_side * PSI(i  , j+1);
    P(i, j) -= prefactor * lap_psi;
#else
    const double lap_psi =
      + w_side * PSI(i  , j-1, k  )
      + w_diag * PSI(i  , j  , k  )
      + w_side * PSI(i  , j+1, k  );
    P(i, j, k) -= prefactor * lap_psi;
#endif
  END
  return 0;
}

src/fluid/update_pressure.c¶

// Subtract prefactor times the discrete z-Laplacian of psi from the pressure p.
// Always returns 0.
static int implicit_z_contribution (
    const domain_t * domain,
    const double prefactor,
    fluid_t * fluid
) {
  // NOTE: the names below are kept as they are,
  //   since the loop / accessor macros presumably refer to them
  const int isize = domain->mysizes[0];
  const int jsize = domain->mysizes[1];
  const int ksize = domain->mysizes[2];
  const double hz = domain->hz;
  const double * restrict psi = fluid->psi.data;
  double * restrict p = fluid->p.data;
  // stencil weights are identical at every point (hz is a scalar):
  //   the two neighbours share one weight, the centre is minus their sum
  const double w_side = 1. / hz / hz;
  const double w_diag = - w_side - w_side;
  BEGIN
    const double lap_psi =
      + w_side * PSI(i  , j  , k-1)
      + w_diag * PSI(i  , j  , k  )
      + w_side * PSI(i  , j  , k+1);
    P(i, j, k) -= prefactor * lap_psi;
  END
  return 0;
}

Momentum Balance¶

SMAC method¶

Prediction Step¶

Correction Step¶

Pressure and Scalar Potential¶

Simple NS Solver

Navigation