Merge branch 'master' into sink_20190723

Conflicts: acc/mhd_solver/stencil_process.sps I've mannaully resolved the conflict, only that I'm leaving int3 globalVertexIdx as is, as instructed by Miikka.
2019-08-12 14:01:19 +08:00
parent b782ead4f3 fdadd463b7
commit e7ff447510
17 changed files with 244 additions and 885 deletions
--- a/acc/mhd_solver/stencil_assembly.sas
+++ b/acc/mhd_solver/stencil_assembly.sas
@@ -1,11 +1,11 @@
 Preprocessed Scalar
-value(in Scalar vertex)
+value(in ScalarField vertex)
 {
    return vertex[vertexIdx];
 }

 Preprocessed Vector
-gradient(in Scalar vertex)
+gradient(in ScalarField vertex)
 {
    return (Vector){derx(vertexIdx, vertex),
                    dery(vertexIdx, vertex),
@@ -15,7 +15,7 @@ gradient(in Scalar vertex)
 #if LUPWD

 Preprocessed Scalar
-der6x_upwd(in Scalar vertex)
+der6x_upwd(in ScalarField vertex)
 {
    Scalar inv_ds = DCONST_REAL(AC_inv_dsx);

@@ -30,7 +30,7 @@ der6x_upwd(in Scalar vertex)
 }

 Preprocessed Scalar
-der6y_upwd(in Scalar vertex)
+der6y_upwd(in ScalarField vertex)
 {
    Scalar inv_ds = DCONST_REAL(AC_inv_dsy);

@@ -45,7 +45,7 @@ der6y_upwd(in Scalar vertex)
 }

 Preprocessed Scalar
-der6z_upwd(in Scalar vertex)
+der6z_upwd(in ScalarField vertex)
 {
    Scalar inv_ds = DCONST_REAL(AC_inv_dsz);

@@ -62,7 +62,7 @@ der6z_upwd(in Scalar vertex)
 #endif

 Preprocessed Matrix
-hessian(in Scalar vertex)
+hessian(in ScalarField vertex)
 {
    Matrix hessian;

--- a/acc/mhd_solver/stencil_process.sps
+++ b/acc/mhd_solver/stencil_process.sps
@@ -23,14 +23,14 @@ uniform int ny;
 uniform int nz;

 Vector
-value(in Vector uu)
+value(in VectorField uu)
 {
    return (Vector){value(uu.x), value(uu.y), value(uu.z)};
 }

 #if LUPWD
 Scalar
-upwd_der6(in Vector uu, in Scalar lnrho)
+upwd_der6(in VectorField uu, in ScalarField lnrho)
 {
    Scalar uux = fabs(value(uu).x);
    Scalar uuy = fabs(value(uu).y);
@@ -40,13 +40,13 @@ upwd_der6(in Vector uu, in Scalar lnrho)
 #endif

 Matrix
-gradients(in Vector uu)
+gradients(in VectorField uu)
 {
    return (Matrix){gradient(uu.x), gradient(uu.y), gradient(uu.z)};
 }

 Scalar
-continuity(in Vector uu, in Scalar lnrho) {
+continuity(in VectorField uu, in ScalarField lnrho) {
    return -dot(value(uu), gradient(lnrho))
 #if LUPWD
           //This is a corrective hyperdiffusion term for upwinding.
@@ -124,7 +124,7 @@ accretion_profile(int3 globalVertexIdx, in Scalar lnrho){

 #if LENTROPY
 Vector
-momentum(int3 globalVertexIdx, in Vector uu, in Scalar lnrho, in Scalar ss, in Vector aa) {
+momentum(int3 globalVertexIdx, in VectorField uu, in ScalarField lnrho, in ScalarField ss, in VectorField aa) {
    const Matrix S = stress_tensor(uu);
    const Scalar cs2 = cs2_sound * exp(gamma * value(ss) / cp_sound + (gamma - 1) * (value(lnrho) - lnrho0));
    const Vector  j = (Scalar(1.) / mu0) * (gradient_of_divergence(aa) - laplace_vec(aa)); // Current density
@@ -152,13 +152,10 @@ momentum(int3 globalVertexIdx, in Vector uu, in Scalar lnrho, in Scalar ss, in V
 }
 #elif LTEMPERATURE
 Vector
-momentum(int3 globalVertexIdx, in Vector uu, in Scalar lnrho, in Scalar tt) {
+momentum(int3 globalVertexIdx, in VectorField uu, in ScalarField lnrho, in ScalarField tt) {
    Vector mom;
-
    const Matrix S = stress_tensor(uu);
-
    const Vector pressure_term = (cp_sound - cv_sound) * (gradient(tt) + value(tt) * gradient(lnrho));
-
    mom = -mul(gradients(uu), value(uu)) -
    pressure_term +
    nu_visc *
@@ -175,9 +172,8 @@ momentum(int3 globalVertexIdx, in Vector uu, in Scalar lnrho, in Scalar tt) {
 }
 #else
 Vector
-momentum(int3 globalVertexIdx, in Vector uu, in Scalar lnrho) {
+momentum(int3 globalVertexIdx, in VectorField uu, in ScalarField lnrho) {
    Vector mom;
-
    const Matrix S = stress_tensor(uu);

    // Isothermal: we have constant speed of sound
@@ -200,7 +196,7 @@ momentum(int3 globalVertexIdx, in Vector uu, in Scalar lnrho) {


 Vector
-induction(in Vector uu, in Vector aa) {
+induction(in VectorField uu, in VectorField aa) {
  // Note: We do (-nabla^2 A + nabla(nabla dot A)) instead of (nabla x (nabla
  // x A)) in order to avoid taking the first derivative twice (did the math,
  // yes this actually works. See pg.28 in arXiv:astro-ph/0109497)
@@ -218,7 +214,7 @@ induction(in Vector uu, in Vector aa) {

 #if LENTROPY
 Scalar
-lnT( in Scalar ss, in Scalar lnrho) {
+lnT( in ScalarField ss, in ScalarField lnrho) {
  const Scalar lnT = lnT0 + gamma * value(ss) / cp_sound +
    (gamma - Scalar(1.)) * (value(lnrho) - lnrho0);
  return lnT;
@@ -226,7 +222,7 @@ lnT( in Scalar ss, in Scalar lnrho) {

 // Nabla dot (K nabla T) / (rho T)
 Scalar
-heat_conduction( in Scalar ss, in Scalar lnrho) {
+heat_conduction( in ScalarField ss, in ScalarField lnrho) {
  const Scalar inv_cp_sound = AcReal(1.) / cp_sound;

  const Vector grad_ln_chi = - gradient(lnrho);
@@ -249,7 +245,7 @@ heating(const int i, const int j, const int k) {
 }

 Scalar
-entropy(in Scalar ss, in Vector uu, in Scalar lnrho, in Vector aa) {
+entropy(in ScalarField ss, in VectorField uu, in ScalarField lnrho, in VectorField aa) {
    const Matrix S = stress_tensor(uu);
    const Scalar inv_pT = Scalar(1.) / (exp(value(lnrho)) * exp(lnT(ss, lnrho)));
    const Vector  j = (Scalar(1.) / mu0) * (gradient_of_divergence(aa) - laplace_vec(aa)); // Current density
@@ -266,7 +262,7 @@ entropy(in Scalar ss, in Vector uu, in Scalar lnrho, in Vector aa) {

 #if LTEMPERATURE
 Scalar
-heat_transfer(in Vector uu, in Scalar lnrho, in Scalar tt)
+heat_transfer(in VectorField uu, in ScalarField lnrho, in ScalarField tt)
 {
    const Matrix S = stress_tensor(uu);
    const Scalar heat_diffusivity_k = 0.0008; //8e-4;
@@ -365,26 +361,26 @@ forcing(int3 globalVertexIdx, Scalar dt)

 // Declare input and output arrays using locations specified in the
 // array enum in astaroth.h
-in Scalar lnrho = VTXBUF_LNRHO;
-out Scalar out_lnrho = VTXBUF_LNRHO;
+in ScalarField lnrho(VTXBUF_LNRHO);
+out ScalarField out_lnrho(VTXBUF_LNRHO);

-in Vector uu = (int3) {VTXBUF_UUX, VTXBUF_UUY, VTXBUF_UUZ};
-out Vector out_uu = (int3) {VTXBUF_UUX,VTXBUF_UUY,VTXBUF_UUZ};
+in VectorField uu(VTXBUF_UUX, VTXBUF_UUY, VTXBUF_UUZ);
+out VectorField out_uu(VTXBUF_UUX,VTXBUF_UUY,VTXBUF_UUZ);


 #if LMAGNETIC
-in Vector aa = (int3) {VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ};
-out Vector out_aa = (int3) {VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ};
+in VectorField aa(VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ);
+out VectorField out_aa(VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ);
 #endif

 #if LENTROPY
-in Scalar ss = VTXBUF_ENTROPY;
-out Scalar out_ss = VTXBUF_ENTROPY;
+in ScalarField ss(VTXBUF_ENTROPY);
+out ScalarField out_ss(VTXBUF_ENTROPY);
 #endif

 #if LTEMPERATURE
-in Scalar tt = VTXBUF_TEMPERATURE;
-out Scalar out_tt = VTXBUF_TEMPERATURE;
+in ScalarField tt(VTXBUF_TEMPERATURE);
+out ScalarField out_tt(VTXBUF_TEMPERATURE);
 #endif

 #if LSINK
--- a/acc/pseudodisk/stencil_process_gravx.sps
+++ b/acc/pseudodisk/stencil_process_gravx.sps
@@ -43,19 +43,19 @@ distance_x(Vector a, Vector b)
 }

 Vector
-value(in Vector uu)
+value(in VectorField uu)
 {
    return (Vector){value(uu.x), value(uu.y), value(uu.z)};
 }

 Matrix
-gradients(in Vector uu)
+gradients(in VectorField uu)
 {
    return (Matrix){gradient(uu.x), gradient(uu.y), gradient(uu.z)};
 }

 Scalar
-continuity(in Vector uu, in Scalar lnrho) {
+continuity(in VectorField uu, in ScalarField lnrho) {
    return -dot(value(uu), gradient(lnrho)) - divergence(uu);
 }

@@ -79,7 +79,7 @@ grav_force_line(const int3 vertexIdx)

 #if LENTROPY
 Vector
-momentum(in Vector uu, in Scalar lnrho, in Scalar ss, in Vector aa, const int3 vertexIdx) {
+momentum(in VectorField uu, in ScalarField lnrho, in ScalarField ss, in VectorField aa, const int3 vertexIdx) {
  Vector mom;

  const Matrix S = stress_tensor(uu);
@@ -104,7 +104,7 @@ momentum(in Vector uu, in Scalar lnrho, in Scalar ss, in Vector aa, const int3 v
 }
 #else
 Vector
-momentum(in Vector uu, in Scalar lnrho, const int3 vertexIdx) {
+momentum(in VectorField uu, in ScalarField lnrho, const int3 vertexIdx) {
  Vector mom;

  const Matrix S = stress_tensor(uu);
@@ -123,7 +123,7 @@ momentum(in Vector uu, in Scalar lnrho, const int3 vertexIdx) {


 Vector
-induction(in Vector uu, in Vector aa) {
+induction(in VectorField uu, in VectorField aa) {
  // Note: We do (-nabla^2 A + nabla(nabla dot A)) instead of (nabla x (nabla
  // x A)) in order to avoid taking the first derivative twice (did the math,
  // yes this actually works. See pg.28 in arXiv:astro-ph/0109497)
@@ -141,7 +141,7 @@ induction(in Vector uu, in Vector aa) {

 #if LENTROPY
 Scalar
-lnT( in Scalar ss, in Scalar lnrho) {
+lnT( in ScalarField ss, in ScalarField lnrho) {
  const Scalar lnT = LNT0 + value(ss) / cp_sound +
    (gamma - AcReal(1.)) * (value(lnrho) - LNRHO0);
  return lnT;
@@ -149,7 +149,7 @@ lnT( in Scalar ss, in Scalar lnrho) {

 // Nabla dot (K nabla T) / (rho T)
 Scalar
-heat_conduction( in Scalar ss, in Scalar lnrho) {
+heat_conduction( in ScalarField ss, in ScalarField lnrho) {
  const Scalar inv_cp_sound = AcReal(1.) / cp_sound;

  const Vector grad_ln_chi = (Vector) {
@@ -174,7 +174,7 @@ heating(const int i, const int j, const int k) {
 }

 Scalar
-entropy(in Scalar ss, in Vector uu, in Scalar lnrho, in Vector aa) {
+entropy(in ScalarField ss, in VectorField uu, in ScalarField lnrho, in VectorField aa) {
    const Matrix S = stress_tensor(uu);

    // nabla x nabla x A / mu0 = nabla(nabla dot A) - nabla^2(A)
@@ -193,21 +193,21 @@ entropy(in Scalar ss, in Vector uu, in Scalar lnrho, in Vector aa) {

 // Declare input and output arrays using locations specified in the
 // array enum in astaroth.h
-in Scalar lnrho = VTXBUF_LNRHO;
-out Scalar out_lnrho = VTXBUF_LNRHO;
+in ScalarField lnrho(VTXBUF_LNRHO);
+out ScalarField out_lnrho(VTXBUF_LNRHO);

-in Vector uu = (int3) {VTXBUF_UUX, VTXBUF_UUY, VTXBUF_UUZ};
-out Vector out_uu = (int3) {VTXBUF_UUX,VTXBUF_UUY,VTXBUF_UUZ};
+in VectorField uu(VTXBUF_UUX, VTXBUF_UUY, VTXBUF_UUZ);
+out VectorField out_uu(VTXBUF_UUX,VTXBUF_UUY,VTXBUF_UUZ);


 #if LMAGNETIC
-in Vector aa = (int3) {VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ};
-out Vector out_aa = (int3) {VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ};
+in VectorField aa(VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ);
+out VectorField out_aa(VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ);
 #endif

 #if LENTROPY
-in Scalar ss = VTXBUF_ENTROPY;
-out Scalar out_ss = VTXBUF_ENTROPY;
+in ScalarField ss(VTXBUF_ENTROPY);
+out ScalarField out_ss(VTXBUF_ENTROPY);
 #endif

 Kernel void
--- a/acc/pseudodisk/stencil_process_isotherm_gravx.sps
+++ b/acc/pseudodisk/stencil_process_isotherm_gravx.sps
@@ -40,19 +40,19 @@ distance_x(Vector a, Vector b)
 }

 Vector
-value(in Vector uu)
+value(in VectorField uu)
 {
    return (Vector){value(uu.x), value(uu.y), value(uu.z)};
 }

 Matrix
-gradients(in Vector uu)
+gradients(in VectorField uu)
 {
    return (Matrix){gradient(uu.x), gradient(uu.y), gradient(uu.z)};
 }

 Scalar
-continuity(in Vector uu, in Scalar lnrho) {
+continuity(in VectorField uu, in ScalarField lnrho) {
    return -dot(value(uu), gradient(lnrho)) - divergence(uu);
 }

@@ -77,7 +77,7 @@ grav_force_line(const int3 vertexIdx)


 Vector
-momentum(in Vector uu, in Scalar lnrho, const int3 vertexIdx) {
+momentum(in VectorField uu, in ScalarField lnrho, const int3 vertexIdx) {
  Vector mom;

  const Matrix S = stress_tensor(uu);
@@ -94,7 +94,7 @@ momentum(in Vector uu, in Scalar lnrho, const int3 vertexIdx) {
 }

 Vector
-induction(in Vector uu, in Vector aa) {
+induction(in VectorField uu, in VectorField aa) {
  // Note: We do (-nabla^2 A + nabla(nabla dot A)) instead of (nabla x (nabla
  // x A)) in order to avoid taking the first derivative twice (did the math,
  // yes this actually works. See pg.28 in arXiv:astro-ph/0109497)
@@ -111,15 +111,16 @@ induction(in Vector uu, in Vector aa) {

 // Declare input and output arrays using locations specified in the
 // array enum in astaroth.h
-in Scalar lnrho = VTXBUF_LNRHO;
-out Scalar out_lnrho = VTXBUF_LNRHO;
+in ScalarField lnrho(VTXBUF_LNRHO);
+out ScalarField out_lnrho(VTXBUF_LNRHO);
+
+in VectorField uu(VTXBUF_UUX, VTXBUF_UUY, VTXBUF_UUZ);
+out VectorField out_uu(VTXBUF_UUX,VTXBUF_UUY,VTXBUF_UUZ);

-in Vector uu = (int3) {VTXBUF_UUX, VTXBUF_UUY, VTXBUF_UUZ};
-out Vector out_uu = (int3) {VTXBUF_UUX,VTXBUF_UUY,VTXBUF_UUZ};

 #if LMAGNETIC
-in Vector aa = (int3) {VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ};
-out Vector out_aa = (int3) {VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ};
+in VectorField aa(VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ);
+out VectorField out_aa(VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ);
 #endif

 Kernel void
@@ -132,38 +133,3 @@ solve(Scalar dt) {

  WRITE(out_uu, RK3(out_uu, uu, momentum(uu, lnrho, vertexIdx), dt));
 }
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
--- a/acc/pseudodisk/stencil_process_isotherm_linegrav.sps
+++ b/acc/pseudodisk/stencil_process_isotherm_linegrav.sps
@@ -40,19 +40,19 @@ distance(Vector a, Vector b)
 }

 Vector
-value(in Vector uu)
+value(in VectorField uu)
 {
    return (Vector){value(uu.x), value(uu.y), value(uu.z)};
 }

 Matrix
-gradients(in Vector uu)
+gradients(in VectorField uu)
 {
    return (Matrix){gradient(uu.x), gradient(uu.y), gradient(uu.z)};
 }

 Scalar
-continuity(in Vector uu, in Scalar lnrho) {
+continuity(in VectorField uu, in ScalarField lnrho) {
    return -dot(value(uu), gradient(lnrho)) - divergence(uu);
 }

@@ -82,7 +82,7 @@ grav_force_line(const int3 vertexIdx)


 Vector
-momentum(in Vector uu, in Scalar lnrho, const int3 vertexIdx) {
+momentum(in VectorField uu, in ScalarField lnrho, const int3 vertexIdx) {
  Vector mom;

  const Matrix S = stress_tensor(uu);
@@ -99,7 +99,7 @@ momentum(in Vector uu, in Scalar lnrho, const int3 vertexIdx) {
 }

 Vector
-induction(in Vector uu, in Vector aa) {
+induction(in VectorField uu, in VectorField aa) {
  // Note: We do (-nabla^2 A + nabla(nabla dot A)) instead of (nabla x (nabla
  // x A)) in order to avoid taking the first derivative twice (did the math,
  // yes this actually works. See pg.28 in arXiv:astro-ph/0109497)
@@ -116,15 +116,15 @@ induction(in Vector uu, in Vector aa) {

 // Declare input and output arrays using locations specified in the
 // array enum in astaroth.h
-in Scalar lnrho = VTXBUF_LNRHO;
-out Scalar out_lnrho = VTXBUF_LNRHO;
+in ScalarField lnrho(VTXBUF_LNRHO);
+out ScalarField out_lnrho(VTXBUF_LNRHO);

-in Vector uu = (int3) {VTXBUF_UUX, VTXBUF_UUY, VTXBUF_UUZ};
-out Vector out_uu = (int3) {VTXBUF_UUX,VTXBUF_UUY,VTXBUF_UUZ};
+in VectorField uu(VTXBUF_UUX, VTXBUF_UUY, VTXBUF_UUZ);
+out VectorField out_uu(VTXBUF_UUX,VTXBUF_UUY,VTXBUF_UUZ);

 #if LMAGNETIC
-in Vector aa = (int3) {VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ};
-out Vector out_aa = (int3) {VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ};
+in VectorField aa(VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ);
+out VectorField out_aa(VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ);
 #endif

 Kernel void
@@ -137,38 +137,3 @@ solve(Scalar dt) {

  WRITE(out_uu, RK3(out_uu, uu, momentum(uu, lnrho, vertexIdx), dt));
 }
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
--- a/acc/pseudodisk/stencil_process_linegrav.sps
+++ b/acc/pseudodisk/stencil_process_linegrav.sps
@@ -43,19 +43,19 @@ distance_x(Vector a, Vector b)
 }

 Vector
-value(in Vector uu)
+value(in VectorField uu)
 {
    return (Vector){value(uu.x), value(uu.y), value(uu.z)};
 }

 Matrix
-gradients(in Vector uu)
+gradients(in VectorField uu)
 {
    return (Matrix){gradient(uu.x), gradient(uu.y), gradient(uu.z)};
 }

 Scalar
-continuity(in Vector uu, in Scalar lnrho) {
+continuity(in VectorField uu, in ScalarField lnrho) {
    return -dot(value(uu), gradient(lnrho)) - divergence(uu);
 }

@@ -84,7 +84,7 @@ grav_force_line(const int3 vertexIdx)

 #if LENTROPY
 Vector
-momentum(in Vector uu, in Scalar lnrho, in Scalar ss, in Vector aa, const int3 vertexIdx) {
+momentum(in VectorField uu, in ScalarField lnrho, in ScalarField ss, in VectorField aa, const int3 vertexIdx) {
  Vector mom;

  const Matrix S = stress_tensor(uu);
@@ -109,7 +109,7 @@ momentum(in Vector uu, in Scalar lnrho, in Scalar ss, in Vector aa, const int3 v
 }
 #else
 Vector
-momentum(in Vector uu, in Scalar lnrho, const int3 vertexIdx) {
+momentum(in VectorField uu, in ScalarField lnrho, const int3 vertexIdx) {
  Vector mom;

  const Matrix S = stress_tensor(uu);
@@ -128,7 +128,7 @@ momentum(in Vector uu, in Scalar lnrho, const int3 vertexIdx) {


 Vector
-induction(in Vector uu, in Vector aa) {
+induction(in VectorField uu, in VectorField aa) {
  // Note: We do (-nabla^2 A + nabla(nabla dot A)) instead of (nabla x (nabla
  // x A)) in order to avoid taking the first derivative twice (did the math,
  // yes this actually works. See pg.28 in arXiv:astro-ph/0109497)
@@ -146,7 +146,7 @@ induction(in Vector uu, in Vector aa) {

 #if LENTROPY
 Scalar
-lnT( in Scalar ss, in Scalar lnrho) {
+lnT( in ScalarField ss, in ScalarField lnrho) {
  const Scalar lnT = LNT0 + value(ss) / cp_sound +
    (gamma - AcReal(1.)) * (value(lnrho) - LNRHO0);
  return lnT;
@@ -154,7 +154,7 @@ lnT( in Scalar ss, in Scalar lnrho) {

 // Nabla dot (K nabla T) / (rho T)
 Scalar
-heat_conduction( in Scalar ss, in Scalar lnrho) {
+heat_conduction( in ScalarField ss, in ScalarField lnrho) {
  const Scalar inv_cp_sound = AcReal(1.) / cp_sound;

  const Vector grad_ln_chi = (Vector) {
@@ -179,7 +179,7 @@ heating(const int i, const int j, const int k) {
 }

 Scalar
-entropy(in Scalar ss, in Vector uu, in Scalar lnrho, in Vector aa) {
+entropy(in ScalarField ss, in VectorField uu, in ScalarField lnrho, in VectorField aa) {
    const Matrix S = stress_tensor(uu);

    // nabla x nabla x A / mu0 = nabla(nabla dot A) - nabla^2(A)
@@ -198,21 +198,20 @@ entropy(in Scalar ss, in Vector uu, in Scalar lnrho, in Vector aa) {

 // Declare input and output arrays using locations specified in the
 // array enum in astaroth.h
-in Scalar lnrho = VTXBUF_LNRHO;
-out Scalar out_lnrho = VTXBUF_LNRHO;
-
-in Vector uu = (int3) {VTXBUF_UUX, VTXBUF_UUY, VTXBUF_UUZ};
-out Vector out_uu = (int3) {VTXBUF_UUX,VTXBUF_UUY,VTXBUF_UUZ};
+in ScalarField lnrho(VTXBUF_LNRHO);
+out ScalarField out_lnrho(VTXBUF_LNRHO);

+in VectorField uu(VTXBUF_UUX, VTXBUF_UUY, VTXBUF_UUZ);
+out VectorField out_uu(VTXBUF_UUX,VTXBUF_UUY,VTXBUF_UUZ);

 #if LMAGNETIC
-in Vector aa = (int3) {VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ};
-out Vector out_aa = (int3) {VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ};
+in VectorField aa(VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ);
+out VectorField out_aa(VTXBUF_AX,VTXBUF_AY,VTXBUF_AZ);
 #endif

 #if LENTROPY
-in Scalar ss = VTXBUF_ENTROPY;
-out Scalar out_ss = VTXBUF_ENTROPY;
+in ScalarField ss(VTXBUF_ENTROPY);
+out ScalarField out_ss(VTXBUF_ENTROPY);
 #endif

 Kernel void
--- a/acc/samples/common_header.h
+++ b/acc/samples/common_header.h
@@ -1,422 +0,0 @@
-/*
-    Copyright (C) 2014-2019, Johannes Pekkilae, Miikka Vaeisalae.
-
-    This file is part of Astaroth.
-
-    Astaroth is free software: you can redistribute it and/or modify
-    it under the terms of the GNU General Public License as published by
-    the Free Software Foundation, either version 3 of the License, or
-    (at your option) any later version.
-
-    Astaroth is distributed in the hope that it will be useful,
-    but WITHOUT ANY WARRANTY; without even the implied warranty of
-    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-    GNU General Public License for more details.
-
-    You should have received a copy of the GNU General Public License
-    along with Astaroth.  If not, see <http://www.gnu.org/licenses/>.
-*/
-
-/**
- * @file
- * \brief Brief info.
- *
- * Provides an interface to Astaroth. Contains all the necessary configuration
- * structs and functions for running the code on multiple GPUs.
- *
- * All interface functions declared here (such as acInit()) operate all GPUs
- * available in the node under the hood, and the user does not need any
- * information about the decomposition, synchronization or such to use these
- * functions.
- *
- */
-#pragma once
-
-/* Prevent name mangling */
-#ifdef __cplusplus
-extern "C" {
-#endif
-
-#include <float.h>        // FLT_EPSILON, etc
-#include <stdlib.h>       // size_t
-#include <vector_types.h> // CUDA vector types (float4, etc)
-
-
-/*
- * =============================================================================
- * Flags for auto-optimization
- * =============================================================================
- */
-#define AUTO_OPTIMIZE (0) // DEPRECATED TODO remove
-#define BOUNDCONDS_OPTIMIZE (0)
-#define GENERATE_BENCHMARK_DATA (0)
-
-// Device info
-#define REGISTERS_PER_THREAD (255)
-#define MAX_REGISTERS_PER_BLOCK (65536)
-#define MAX_THREADS_PER_BLOCK (1024)
-#define MAX_TB_DIM (MAX_THREADS_PER_BLOCK)
-#define NUM_ITERATIONS (10)
-#define WARP_SIZE (32)
-
-
-/*
- * =============================================================================
- * Compile-time constants used during simulation (user definable)
- * =============================================================================
- */
-#define STENCIL_ORDER (6)
-
-///////////// PAD TEST
-// NOTE: works only with nx is divisible by 32
-//#define PAD_LEAD (32 - STENCIL_ORDER/2)
-//#define PAD_SIZE (32 - STENCIL_ORDER)
-///////////// PAD TEST
-
-// L-prefix inherited from the old Astaroth, no idea what it means
-// MV: L means a Logical switch variale, something having true of false value.
-#define LFORCING (0) // Note: forcing is disabled currently in the files generated by acc (compiler of our DSL)
-#define LMAGNETIC (1)
-#define LENTROPY (1)
-#define LTEMPERATURE (0)
-
-#define AC_THERMAL_CONDUCTIVITY (AcReal(0.001)) // TODO: make an actual config parameter
-
-/*
- * =============================================================================
- * Identifiers used to construct the parameter lists for AcMeshInfo
- * (IntParamType and RealParamType)
- * (user definable)
- * =============================================================================
- */
-// clang-format off
-#define AC_FOR_INT_PARAM_TYPES(FUNC)\
-        /* cparams */\
-        FUNC(AC_nx), \
-        FUNC(AC_ny), \
-        FUNC(AC_nz), \
-        FUNC(AC_mx), \
-        FUNC(AC_my), \
-        FUNC(AC_mz), \
-        FUNC(AC_nx_min), \
-        FUNC(AC_ny_min), \
-        FUNC(AC_nz_min), \
-        FUNC(AC_nx_max), \
-        FUNC(AC_ny_max), \
-        FUNC(AC_nz_max), \
-        /* Other */\
-        FUNC(AC_max_steps), \
-        FUNC(AC_save_steps), \
-        FUNC(AC_bin_steps), \
-        FUNC(AC_bc_type), \
-        /* Additional */\
-        FUNC(AC_mxy),\
-        FUNC(AC_nxy),\
-        FUNC(AC_nxyz)
-#define AC_FOR_REAL_PARAM_TYPES(FUNC)\
-        /* cparams */\
-        FUNC(AC_dsx), \
-        FUNC(AC_dsy), \
-        FUNC(AC_dsz), \
-        FUNC(AC_dsmin), \
-        /* physical grid*/\
-        FUNC(AC_xlen), \
-        FUNC(AC_ylen), \
-        FUNC(AC_zlen), \
-        FUNC(AC_xorig), \
-        FUNC(AC_yorig), \
-        FUNC(AC_zorig), \
-        /*Physical units*/\
-        FUNC(AC_unit_density),\
-        FUNC(AC_unit_velocity),\
-        FUNC(AC_unit_length),\
-        /* properties of gravitating star*/\
-        FUNC(AC_star_pos_x),\
-        FUNC(AC_star_pos_y),\
-        FUNC(AC_star_pos_z),\
-        FUNC(AC_M_star),\
-        /* Run params */\
-        FUNC(AC_cdt), \
-        FUNC(AC_cdtv), \
-        FUNC(AC_cdts), \
-        FUNC(AC_nu_visc), \
-        FUNC(AC_cs_sound), \
-        FUNC(AC_eta), \
-        FUNC(AC_mu0), \
-        FUNC(AC_relhel), \
-        FUNC(AC_cp_sound), \
-        FUNC(AC_gamma), \
-        FUNC(AC_cv_sound), \
-        FUNC(AC_lnT0), \
-        FUNC(AC_lnrho0), \
-        FUNC(AC_zeta), \
-        FUNC(AC_trans),\
-        /* Other */\
-        FUNC(AC_bin_save_t), \
-        /* Initial condition params */\
-        FUNC(AC_ampl_lnrho), \
-        FUNC(AC_ampl_uu), \
-        FUNC(AC_angl_uu), \
-        FUNC(AC_lnrho_edge),\
-        FUNC(AC_lnrho_out),\
-        /* Additional helper params */\
-        /* (deduced from other params do not set these directly!) */\
-        FUNC(AC_G_CONST),\
-        FUNC(AC_GM_star),\
-        FUNC(AC_sq2GM_star),\
-        FUNC(AC_cs2_sound), \
-        FUNC(AC_inv_dsx), \
-        FUNC(AC_inv_dsy), \
-        FUNC(AC_inv_dsz)
-// clang-format on
-
-/*
- * =============================================================================
- * Identifiers for VertexBufferHandle
- * (i.e. the arrays used to construct AcMesh)
- * (user definable)
- * =============================================================================
- */
-// clang-format off
-#define AC_FOR_HYDRO_VTXBUF_HANDLES(FUNC)\
-        FUNC(VTXBUF_LNRHO), \
-        FUNC(VTXBUF_UUX), \
-        FUNC(VTXBUF_UUY), \
-        FUNC(VTXBUF_UUZ), \
-        // FUNC(VTXBUF_DYE),
-
-#if LMAGNETIC
-#define AC_FOR_MAGNETIC_VTXBUF_HANDLES(FUNC)\
-        FUNC(VTXBUF_AX), \
-        FUNC(VTXBUF_AY), \
-        FUNC(VTXBUF_AZ),
-#else
-#define AC_FOR_MAGNETIC_VTXBUF_HANDLES(FUNC)
-#endif
-
-#if LENTROPY
-#define AC_FOR_ENTROPY_VTXBUF_HANDLES(FUNC)\
-        FUNC(VTXBUF_ENTROPY),
-#else
-#define AC_FOR_ENTROPY_VTXBUF_HANDLES(FUNC)
-#endif
-
-#if LTEMPERATURE
-#define AC_FOR_TEMPERATURE_VTXBUF_HANDLES(FUNC)\
-        FUNC(VTXBUF_TEMPERATURE),
-#else
-#define AC_FOR_TEMPERATURE_VTXBUF_HANDLES(FUNC)
-#endif
-
-#define AC_FOR_VTXBUF_HANDLES(FUNC)\
-        AC_FOR_HYDRO_VTXBUF_HANDLES(FUNC)\
-        AC_FOR_MAGNETIC_VTXBUF_HANDLES(FUNC)\
-        AC_FOR_ENTROPY_VTXBUF_HANDLES(FUNC)\
-        AC_FOR_TEMPERATURE_VTXBUF_HANDLES(FUNC)
-// clang-format on
-
-/*
- * =============================================================================
- * Single/double precision switch
- * =============================================================================
- */
-#if AC_DOUBLE_PRECISION == 1
-typedef double AcReal;
-typedef double3 AcReal3;
-#define AC_REAL_MAX (DBL_MAX)
-#define AC_REAL_MIN (DBL_MIN)
-#define AC_REAL_EPSILON (DBL_EPSILON)
-#else
-typedef float AcReal;
-typedef float3 AcReal3;
-#define AC_REAL_MAX (FLT_MAX)
-#define AC_REAL_MIN (FLT_MIN)
-#define AC_REAL_EPSILON (FLT_EPSILON)
-#endif
-
-typedef struct {
-    AcReal3 row[3];
-} AcMatrix;
-
-/*
- * =============================================================================
- * Helper macros
- * =============================================================================
- */
-#define AC_GEN_ID(X) X
-#define AC_GEN_STR(X) #X
-
-/*
- * =============================================================================
- * Error codes
- * =============================================================================
- */
-typedef enum { AC_SUCCESS = 0, AC_FAILURE = 1 } AcResult;
-
-/*
- * =============================================================================
- * Reduction types
- * =============================================================================
- */
-typedef enum {
-    RTYPE_MAX,
-    RTYPE_MIN,
-    RTYPE_RMS,
-    RTYPE_RMS_EXP,
-    NUM_REDUCTION_TYPES
-} ReductionType;
-
-/*
- * =============================================================================
- * Definitions for the enums and structs for AcMeshInfo (DO NOT TOUCH)
- * =============================================================================
- */
-typedef enum {
-    AC_FOR_INT_PARAM_TYPES(AC_GEN_ID),
-    NUM_INT_PARAMS
-} AcIntParam;
-
-typedef enum {
-    AC_FOR_REAL_PARAM_TYPES(AC_GEN_ID),
-    NUM_REAL_PARAMS
-} AcRealParam;
-
-extern const char* intparam_names[];  // Defined in astaroth.cu
-extern const char* realparam_names[]; // Defined in astaroth.cu
-
-typedef struct {
-    int int_params[NUM_INT_PARAMS];
-    AcReal real_params[NUM_REAL_PARAMS];
-} AcMeshInfo;
-
-/*
- * =============================================================================
- * Definitions for the enums and structs for AcMesh (DO NOT TOUCH)
- * =============================================================================
- */
-typedef enum {
-    AC_FOR_VTXBUF_HANDLES(AC_GEN_ID) NUM_VTXBUF_HANDLES
-} VertexBufferHandle;
-
-extern const char* vtxbuf_names[]; // Defined in astaroth.cu
-
-/*
-typedef struct {
-    AcReal* data;
-} VertexBuffer;
-*/
-
-// NOTE: there's no particular benefit declaring AcMesh a class, since
-// a library user may already have allocated memory for the vertex_buffers.
-// But then we would allocate memory again when the user wants to start
-// filling the class with data. => Its better to consider AcMesh as a
-// payload-only struct
-typedef struct {
-    AcReal* vertex_buffer[NUM_VTXBUF_HANDLES];
-    AcMeshInfo info;
-} AcMesh;
-
-#define acVertexBufferSize(mesh_info)                                              \
-    ((size_t)(mesh_info.int_params[AC_mx] * mesh_info.int_params[AC_my] *      \
-              mesh_info.int_params[AC_mz]))
-
-#define acVertexBufferSizeBytes(mesh_info)                                        \
-    (sizeof(AcReal) * acVertexBufferSize(mesh_info))
-
-#define acVertexBufferCompdomainSize(mesh_info)                                   \
-    (mesh_info.int_params[AC_nx] * mesh_info.int_params[AC_ny] *               \
-     mesh_info.int_params[AC_nz])
-
-#define acVertexBufferCompdomainSizeBytes(mesh_info)                             \
-    (sizeof(AcReal) * acVertexBufferCompdomainSize(mesh_info))
-
-#define acVertexBufferIdx(i, j, k, mesh_info)                                      \
-    ((i) + (j)*mesh_info.int_params[AC_mx] +                                   \
-     (k)*mesh_info.int_params[AC_mx] * mesh_info.int_params[AC_my])
-
-/*
- * =============================================================================
- * Astaroth interface
- * =============================================================================
- */
-/** Starting point of all GPU computation. Handles the allocation and
-initialization of *all memory needed on all GPUs in the node*. In other words,
-setups everything GPU-side so that calling any other GPU interface function
-afterwards does not result in illegal memory accesses. */
-AcResult acInit(const AcMeshInfo& mesh_info);
-
-/** Splits the host_mesh and distributes it among the GPUs in the node */
-AcResult acLoad(const AcMesh& host_mesh);
-AcResult acLoadWithOffset(const AcMesh& host_mesh, const int3& start, const int num_vertices);
-
-/** Does all three steps of the RK3 integration and computes the boundary
-conditions when necessary. Note that the boundary conditions are not applied
-after the final integration step.
-The result can be fetched to CPU memory with acStore(). */
-AcResult acIntegrate(const AcReal& dt);
-
-/** Performs a single RK3 step without computing boundary conditions. */
-AcResult acIntegrateStep(const int& isubstep, const AcReal& dt);
-
-/** Applies boundary conditions on the GPU meshs and communicates the
- ghost zones among GPUs if necessary */
-AcResult acBoundcondStep(void);
-
-/** Performs a scalar reduction on all GPUs in the node and returns the result.
- */
-AcReal acReduceScal(const ReductionType& rtype, const VertexBufferHandle& a);
-
-/** Performs a vector reduction on all GPUs in the node and returns the result.
- */
-AcReal acReduceVec(const ReductionType& rtype, const VertexBufferHandle& a,
-                   const VertexBufferHandle& b, const VertexBufferHandle& c);
-
-/** Stores the mesh distributed among GPUs of the node back to a single host
- * mesh */
-AcResult acStore(AcMesh* host_mesh);
-AcResult acStoreWithOffset(const int3& start, const int num_vertices, AcMesh* host_mesh);
-
-/** Frees all GPU allocations and resets all devices in the node. Should be
- * called at exit. */
-AcResult acQuit(void);
-
-/** Synchronizes all devices. All calls to Astaroth are asynchronous by default
-    unless otherwise stated. */
-AcResult acSynchronize(void);
-
-/* End extern "C" */
-#ifdef __cplusplus
-}
-#endif
-
-/*
- * =============================================================================
- * Notes
- * =============================================================================
- */
-/*
-typedef enum {
-    VTX_BUF_LNRHO,
-    VTX_BUF_UUX,
-    VTX_BUF_UUY,
-    VTX_BUF_UUZ,
-    NUM_VERTEX_BUFFER_HANDLES
-} VertexBufferHandle
-
-// LNRHO etc
-typedef struct {
-    AcReal* data;
-} VertexBuffer;
-
-// Host
-typedef struct {
-    VertexBuffer vertex_buffers[NUM_VERTEX_BUFFER_HANDLES];
-    MeshInfo info;
-} Mesh;
-
-// Device
-typedef struct {
-    VertexBuffer in[NUM_VERTEX_BUFFER_HANDLES];
-    VertexBuffer out[NUM_VERTEX_BUFFER_HANDLES];
-} VertexBufferArray;
-*/
--- a/acc/samples/sample_stencil_assembly.sas
+++ b/acc/samples/sample_stencil_assembly.sas
@@ -1,49 +0,0 @@
-// TODO comments and reformatting
-
-//Scalar
-//dostuff(in Scalar uux)
-//{
-//   return uux[vertexIdx.x, vertexIdx.y, vertexIdx.z];
-//}
-
-// stencil_assembly.in
-Preprocessed Scalar
-some_exotic_stencil_computation(in Scalar uux)
-{
-    //#if STENCIL_ORDER == 2
-    //    const Scalar coefficients[] = {1, 1, 1};
-    //#else if STENCIL_ORDER == 4
-    //    const Scalar coefficients[] = {....};
-    //#endif
-
-    int i = vertexIdx.x;
-    int j = vertexIdx.y;
-    int k = vertexIdx.z;
-    const Scalar coefficients[] = {1, 2, 3};
-
-    return coefficients[0] * uux[i-1, j, k] + 
-           coefficients[1] * uux[i, j, k] + 
-           coefficients[2] * uux[i+1, j, k];
-}
-
-// stencil_process.in
-//in Scalar uux_in = VTXBUF_UUX;
-//out Scalar uux_out = VTXBUF_UUX;
-
-
-//Kernel
-//solve(Scalar dt)
-//{
-//    uux_out = some_exotic_stencil(uux_in);
-//}
-
-
-
-
-
-
-
-
-
-
-
--- a/acc/samples/sample_stencil_process.sps
+++ b/acc/samples/sample_stencil_process.sps
@@ -1,149 +0,0 @@
-// TODO comments and reformatting
-
-uniform Scalar dsx;
-uniform Scalar dsy;
-uniform Scalar dsz;
-
-uniform Scalar GM_star;
-// Other uniforms types than Scalar or int not yet supported
-
-// BUILTIN
-//Scalar dot(...){}
-
-// BUILTIN
-//Scalar distance(Vector a, Vector b) { return sqrt(dot(a, b)); }
-
-// BUILTIN
-// Scalar first_derivative(Scalar pencil[], Scalar inv_ds) { return pencil[3] * inv_ds; }
-
-Scalar first_derivative(Scalar pencil[], Scalar inv_ds)
-{
-    Scalar res = 0;
-    for (int i = 0; i < STENCIL_ORDER+1; ++i) {
-        res = res + pencil[i];
-    }
-    return inv_ds * res;
-}
-
-Scalar distance(Vector a, Vector b)
-{
-    return sqrt(a.x * b.x + a.y * b.y + a.z * b.z); 
-}
-
-Scalar
-gravity_potential(int i, int j, int k)
-{
-    Vector star_pos = (Vector){0, 0, 0};
-    Vector vertex_pos = (Vector){dsx * i, dsy * j, dsz * k};
-    return GM_star / distance(star_pos, vertex_pos);
-}
-
-Scalar
-gradx_gravity_potential(int i, int j, int k)
-{
-    Scalar pencil[STENCIL_ORDER + 1];
-    for (int offset = -STENCIL_ORDER; offset <= STENCIL_ORDER; ++offset) {
-        pencil[offset+STENCIL_ORDER] = gravity_potential(i + offset, j, k);
-    }
-
-    Scalar inv_ds = Scalar(1.) / dsx;
-    return first_derivative(pencil, inv_ds);
-}
-
-Scalar
-grady_gravity_potential(int i, int j, int k)
-{
-    Scalar pencil[STENCIL_ORDER + 1];
-    for (int offset = -STENCIL_ORDER; offset <= STENCIL_ORDER; ++offset) {
-        pencil[offset+STENCIL_ORDER] = gravity_potential(i, j + offset, k);
-    }
-
-    Scalar inv_ds = Scalar(1.) / dsy;
-    return first_derivative(pencil, inv_ds);
-}
-
-Scalar
-gradz_gravity_potential(int i, int j, int k)
-{
-    Scalar pencil[STENCIL_ORDER + 1];
-    for (int offset = -STENCIL_ORDER; offset <= STENCIL_ORDER; ++offset) {
-        pencil[offset+STENCIL_ORDER] = gravity_potential(i, j, k + offset);
-    }
-
-    Scalar inv_ds = Scalar(1.) / dsz;
-    return first_derivative(pencil, inv_ds);
-}
-
-Vector
-momentum(int i, int j, int k, in Vector uu)
-{
-
-    Vector gravity_potential = (Vector){gradx_gravity_potential(i, j, k),
-                                      grady_gravity_potential(i, j, k),
-                                      gradz_gravity_potential(i, j, k)};
-
-
-    return gravity_potential;
-}
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
--- a/acc/src/acc.l
+++ b/acc/src/acc.l
@@ -15,6 +15,8 @@ L [a-zA-Z_]
 "void"      { return VOID; } /* Rest of the types inherited from C */
 "int"       { return INT; }
 "int3"      { return INT3; }
+"ScalarField" { return SCALAR; }
+"VectorField" { return VECTOR; }

 "Kernel"       { return KERNEL; } /* Function specifiers */
 "Preprocessed" { return PREPROCESSED; }
--- a/acc/src/acc.y
+++ b/acc/src/acc.y
@@ -101,6 +101,7 @@ exec_statement: declaration
              ;

 assignment: declaration '=' expression                                                  { $$ = astnode_create(NODE_UNKNOWN, $1, $3); $$->infix = '='; }
+          | declaration '(' expression_list ')'                                         { $$ = astnode_create(NODE_UNKNOWN, $1, $3); $$->infix = '('; $$->postfix = ')'; } // C++ style initializer
          | expression '=' expression                                                   { $$ = astnode_create(NODE_UNKNOWN, $1, $3); $$->infix = '='; }
          ;

--- a/acc/src/code_generator.c
+++ b/acc/src/code_generator.c
@@ -229,8 +229,11 @@ translate_latest_symbol(void)
    // IN / OUT
    else if (symbol->type != SYMBOLTYPE_FUNCTION_PARAMETER &&
             (symbol->type_qualifier == IN || symbol->type_qualifier == OUT)) {
-        const char* inout_type_qualifier = "static __device__ const auto";
-        printf("%s %s%s", inout_type_qualifier, inout_name_prefix, symbol_table[handle].identifier);
+
+        printf("static __device__ const %s %s%s", symbol->type_specifier == SCALAR ? "int" : "int3",
+               inout_name_prefix, symbol_table[handle].identifier);
+        if (symbol->type_specifier == VECTOR)
+            printf(" = make_int3");
    }
    // OTHER
    else {
@@ -335,8 +338,8 @@ traverse(const ASTNode* node)
    // Preprocessed parameter boilerplate
    if (node->type == NODE_TYPE_QUALIFIER && node->token == PREPROCESSED)
        inside_preprocessed = true;
-    static const char
-        preprocessed_parameter_boilerplate[] = "const int3 vertexIdx, const int3 globalVertexIdx, ";
+    static const char preprocessed_parameter_boilerplate
+        [] = "const int3& vertexIdx, const int3& globalVertexIdx, ";
    if (inside_preprocessed && node->type == NODE_FUNCTION_PARAMETER_DECLARATION)
        printf("%s ", preprocessed_parameter_boilerplate);
    // BOILERPLATE END////////////////////////////////////////////////////////
@@ -491,8 +494,8 @@ generate_preprocessed_structures(void)

    // FILLING THE DATA STRUCT
    printf("static __device__ __forceinline__ AcRealData\
-            read_data(const int3 vertexIdx,\
-                const int3 globalVertexIdx,\
+            read_data(const int3& vertexIdx,\
+                const int3& globalVertexIdx,\
            AcReal* __restrict__ buf[], const int handle)\
            {\n\
                %sData data;\n",
@@ -527,8 +530,8 @@ generate_preprocessed_structures(void)
        } AcReal3Data;\
        \
        static __device__ __forceinline__ AcReal3Data\
-        read_data(const int3 vertexIdx,\
-                  const int3 globalVertexIdx,\
+        read_data(const int3& vertexIdx,\
+                  const int3& globalVertexIdx,\
                  AcReal* __restrict__ buf[], const int3& handle)\
        {\
            AcReal3Data data;\
--- a/include/astaroth.h
+++ b/include/astaroth.h
@@ -49,6 +49,10 @@ AcResult acInit(const AcMeshInfo mesh_info);
 * called at exit. */
 AcResult acQuit(void);

+/** Checks whether there are any CUDA devices available. Returns AC_SUCCESS if there is 1 or more,
+ * AC_FAILURE otherwise. */
+AcResult acCheckDeviceAvailability(void);
+
 /** Synchronizes a specific stream. All streams are synchronized if STREAM_ALL is passed as a
 * parameter*/
 AcResult acSynchronizeStream(const Stream stream);
@@ -66,8 +70,8 @@ AcResult acStore(AcMesh* host_mesh);
 * substep and the user is responsible for calling acBoundcondStep before reading the data. */
 AcResult acIntegrate(const AcReal dt);

-/** Applies periodic boundary conditions for the Mesh distributed among the devices visible to the
- * caller*/
+/** Applies periodic boundary conditions for the Mesh distributed among the devices visible to
+ * the caller*/
 AcResult acBoundcondStep(void);

 /** Does a scalar reduction with the data stored in some vertex buffer */
@@ -81,6 +85,14 @@ AcReal acReduceVec(const ReductionType rtype, const VertexBufferHandle a,
 */
 AcResult acStoreWithOffset(const int3 dst, const size_t num_vertices, AcMesh* host_mesh);

+/** Will potentially be deprecated in later versions. Added only to fix backwards compatibility with
+ * PC for now.*/
+AcResult acIntegrateStep(const int isubstep, const AcReal dt);
+AcResult acIntegrateStepWithOffset(const int isubstep, const AcReal dt, const int3 start,
+                                   const int3 end);
+AcResult acSynchronize(void);
+AcResult acLoadWithOffset(const AcMesh host_mesh, const int3 src, const int num_vertices);
+
 #ifdef __cplusplus
 } // extern "C"
 #endif
--- a/include/astaroth_defines.h
+++ b/include/astaroth_defines.h
@@ -44,8 +44,6 @@ typedef struct {
 } double3;
 #endif // __CUDACC__

-#include "stencil_defines.h"
-
 // Library flags
 #define VERBOSE_PRINTING (1)

@@ -68,6 +66,8 @@ typedef struct {
    AcReal3 row[3];
 } AcMatrix;

+#include "stencil_defines.h" // User-defined header
+
 // clang-format off
 #define AC_FOR_BUILTIN_INT_PARAM_TYPES(FUNC)\
        FUNC(AC_nx), \
--- a/src/core/astaroth.cu
+++ b/src/core/astaroth.cu
@@ -19,6 +19,9 @@
 // #include "astaroth_defines.h"
 #include "astaroth.h"

+#include "errchk.h"
+#include "math_utils.h" // int3 + int3
+
 #define AC_GEN_STR(X) #X
 const char* intparam_names[]   = {AC_FOR_BUILTIN_INT_PARAM_TYPES(AC_GEN_STR) //
                                AC_FOR_USER_INT_PARAM_TYPES(AC_GEN_STR)};
@@ -33,10 +36,13 @@ const char* vtxbuf_names[]     = {AC_FOR_VTXBUF_HANDLES(AC_GEN_STR)};

 static const int num_nodes = 1;
 static Node nodes[num_nodes];
+static int3 grid_n;

 AcResult
 acInit(const AcMeshInfo mesh_info)
 {
+    grid_n = (int3){mesh_info.int_params[AC_nx], mesh_info.int_params[AC_ny],
+                    mesh_info.int_params[AC_nz]};
    return acNodeCreate(0, mesh_info, &nodes[0]);
 }

@@ -46,6 +52,23 @@ acQuit(void)
    return acNodeDestroy(nodes[0]);
 }

+AcResult
+acCheckDeviceAvailability(void)
+{
+    int device_count; // Separate from num_devices to avoid side effects
+    ERRCHK_CUDA_ALWAYS(cudaGetDeviceCount(&device_count));
+    if (device_count > 0)
+        return AC_SUCCESS;
+    else
+        return AC_FAILURE;
+}
+
+AcResult
+acSynchronize(void)
+{
+    return acNodeSynchronizeStream(nodes[0], STREAM_ALL);
+}
+
 AcResult
 acSynchronizeStream(const Stream stream)
 {
@@ -80,6 +103,20 @@ acIntegrate(const AcReal dt)
    return acNodeIntegrate(nodes[0], dt);
 }

+AcResult
+acIntegrateStep(const int isubstep, const AcReal dt)
+{
+    const int3 start = (int3){NGHOST, NGHOST, NGHOST};
+    const int3 end   = start + grid_n;
+    return acNodeIntegrateSubstep(nodes[0], STREAM_DEFAULT, isubstep, start, end, dt);
+}
+
+AcResult
+acIntegrateStepWithOffset(const int isubstep, const AcReal dt, const int3 start, const int3 end)
+{
+    return acNodeIntegrateSubstep(nodes[0], STREAM_DEFAULT, isubstep, start, end, dt);
+}
+
 AcResult
 acBoundcondStep(void)
 {
@@ -108,3 +145,9 @@ acStoreWithOffset(const int3 dst, const size_t num_vertices, AcMesh* host_mesh)
 {
    return acNodeStoreMeshWithOffset(nodes[0], STREAM_DEFAULT, dst, dst, num_vertices, host_mesh);
 }
+
+AcResult
+acLoadWithOffset(const AcMesh host_mesh, const int3 src, const int num_vertices)
+{
+    return acNodeLoadMeshWithOffset(nodes[0], STREAM_DEFAULT, host_mesh, src, src, num_vertices);
+}
--- a/src/core/kernels/integration.cuh
+++ b/src/core/kernels/integration.cuh
@@ -46,6 +46,9 @@ IDX(const int3 idx)
    return DEVICE_VTXBUF_IDX(idx.x, idx.y, idx.z);
 }

+#define make_int3(a, b, c)                                                                         \
+    (int3) { (int)a, (int)b, (int)c }
+
 static __forceinline__ AcMatrix
 create_rotz(const AcReal radians)
 {
--- a/src/standalone/model/model_rk3.cc
+++ b/src/standalone/model/model_rk3.cc
@@ -282,14 +282,11 @@ der6x_upwd(const int i, const int j, const int k, const ModelScalar* arr)
 {
    ModelScalar inv_ds = get(AC_inv_dsx);

-    return ModelScalar(1.0/60.0)*inv_ds* (
-          -ModelScalar(    20.0)* arr[IDX(i,   j,   k)]
-          +ModelScalar(    15.0)*(arr[IDX(i+1, j,   k)]
-          +                       arr[IDX(i-1, j,   k)])
-          -ModelScalar(     6.0)*(arr[IDX(i+2, j,   k)]
-          +                       arr[IDX(i-2, j,   k)])
-          +                       arr[IDX(i+3, j,   k)]
-          +                       arr[IDX(i-3, j,   k)]);
+    return ModelScalar(1.0 / 60.0) * inv_ds *
+           (-ModelScalar(20.0) * arr[IDX(i, j, k)] +
+            ModelScalar(15.0) * (arr[IDX(i + 1, j, k)] + arr[IDX(i - 1, j, k)]) -
+            ModelScalar(6.0) * (arr[IDX(i + 2, j, k)] + arr[IDX(i - 2, j, k)]) +
+            arr[IDX(i + 3, j, k)] + arr[IDX(i - 3, j, k)]);
 }

 static inline ModelScalar
@@ -297,14 +294,11 @@ der6y_upwd(const int i, const int j, const int k, const ModelScalar* arr)
 {
    ModelScalar inv_ds = get(AC_inv_dsy);

-    return ModelScalar(1.0/60.0)*inv_ds* (
-          -ModelScalar(    20.0)* arr[IDX(i,   j,   k)]
-          +ModelScalar(    15.0)*(arr[IDX(i,   j+1, k)]
-          +                       arr[IDX(i,   j-1, k)])
-          -ModelScalar(     6.0)*(arr[IDX(i,   j+2, k)]
-          +                       arr[IDX(i,   j-2, k)])
-          +                       arr[IDX(i,   j+3, k)]
-          +                       arr[IDX(i,   j-3, k)]);
+    return ModelScalar(1.0 / 60.0) * inv_ds *
+           (-ModelScalar(20.0) * arr[IDX(i, j, k)] +
+            ModelScalar(15.0) * (arr[IDX(i, j + 1, k)] + arr[IDX(i, j - 1, k)]) -
+            ModelScalar(6.0) * (arr[IDX(i, j + 2, k)] + arr[IDX(i, j - 2, k)]) +
+            arr[IDX(i, j + 3, k)] + arr[IDX(i, j - 3, k)]);
 }

 static inline ModelScalar
@@ -312,14 +306,11 @@ der6z_upwd(const int i, const int j, const int k, const ModelScalar* arr)
 {
    ModelScalar inv_ds = get(AC_inv_dsz);

-    return ModelScalar(1.0/60.0)*inv_ds* (
-          -ModelScalar(    20.0)* arr[IDX(i,   j,   k  )]
-          +ModelScalar(    15.0)*(arr[IDX(i,   j,   k+1)]
-          +                       arr[IDX(i,   j,   k-1)])
-          -ModelScalar(     6.0)*(arr[IDX(i,   j,   k+2)]
-          +                       arr[IDX(i,   j,   k-2)])
-          +                       arr[IDX(i,   j,   k+3)]
-          +                       arr[IDX(i,   j,   k-3)]);
+    return ModelScalar(1.0 / 60.0) * inv_ds *
+           (-ModelScalar(20.0) * arr[IDX(i, j, k)] +
+            ModelScalar(15.0) * (arr[IDX(i, j, k + 1)] + arr[IDX(i, j, k - 1)]) -
+            ModelScalar(6.0) * (arr[IDX(i, j, k + 2)] + arr[IDX(i, j, k - 2)]) +
+            arr[IDX(i, j, k + 3)] + arr[IDX(i, j, k - 3)]);
 }
 #endif

@@ -339,7 +330,8 @@ compute_gradient(const int i, const int j, const int k, const ModelScalar* arr)
 static inline ModelVector
 compute_upwind(const int i, const int j, const int k, const ModelScalar* arr)
 {
-    return (ModelVector){der6x_upwd(i, j, k, arr), der6y_upwd(i, j, k, arr), der6z_upwd(i, j, k, arr)};
+    return (ModelVector){der6x_upwd(i, j, k, arr), der6y_upwd(i, j, k, arr),
+                         der6z_upwd(i, j, k, arr)};
 }
 #endif

@@ -416,8 +408,6 @@ gradients(const ModelVectorData& data)
    return (ModelMatrix){gradient(data.x), gradient(data.y), gradient(data.z)};
 }

-
-
 /*
 * =============================================================================
 * Level 0.3 (Built-in functions available during the Stencil Processing Stage)
@@ -571,10 +561,10 @@ contract(const ModelMatrix& mat)
 ModelScalar
 upwd_der6(const ModelVectorData& uu, const ModelScalarData& lnrho)
 {
-    ModelScalar uux = fabs(value(uu).x);
-    ModelScalar uuy = fabs(value(uu).y);
-    ModelScalar uuz = fabs(value(uu).z);
-    return uux*lnrho.upwind.x + uuy*lnrho.upwind.y + uuz*lnrho.upwind.z;
+    ModelScalar uux = fabsl(value(uu).x);
+    ModelScalar uuy = fabsl(value(uu).y);
+    ModelScalar uuz = fabsl(value(uu).z);
+    return uux * lnrho.upwind.x + uuy * lnrho.upwind.y + uuz * lnrho.upwind.z;
 }
 #endif

@@ -583,7 +573,7 @@ continuity(const ModelVectorData& uu, const ModelScalarData& lnrho)
 {
    return -dot(value(uu), gradient(lnrho))
 #if LUPWD
-           //This is a corrective hyperdiffusion term for upwinding.
+           // This is a corrective hyperdiffusion term for upwinding.
           + upwd_der6(uu, lnrho)
 #endif
           - divergence(uu);
@@ -760,24 +750,23 @@ helical_forcing(ModelScalar magnitude, ModelVector k_force, ModelVector xx, Mode
                ModelVector ff_im, ModelScalar phi)
 {
    (void)magnitude; // WARNING: unused
-    xx.x = xx.x*(2.0*M_PI/(get(AC_dsx)*get(AC_nx)));
-    xx.y = xx.y*(2.0*M_PI/(get(AC_dsy)*get(AC_ny)));
-    xx.z = xx.z*(2.0*M_PI/(get(AC_dsz)*get(AC_nz)));
+    xx.x = xx.x * (2.0 * M_PI / (get(AC_dsx) * get(AC_nx)));
+    xx.y = xx.y * (2.0 * M_PI / (get(AC_dsy) * get(AC_ny)));
+    xx.z = xx.z * (2.0 * M_PI / (get(AC_dsz) * get(AC_nz)));

    ModelScalar cos_phi     = cosl(phi);
    ModelScalar sin_phi     = sinl(phi);
    ModelScalar cos_k_dot_x = cosl(dot(k_force, xx));
    ModelScalar sin_k_dot_x = sinl(dot(k_force, xx));
    // Phase affect only the x-component
-    //Scalar real_comp       = cos_k_dot_x;
-    //Scalar imag_comp       = sin_k_dot_x;
-    ModelScalar real_comp_phase = cos_k_dot_x*cos_phi - sin_k_dot_x*sin_phi;
-    ModelScalar imag_comp_phase = cos_k_dot_x*sin_phi + sin_k_dot_x*cos_phi;
+    // Scalar real_comp       = cos_k_dot_x;
+    // Scalar imag_comp       = sin_k_dot_x;
+    ModelScalar real_comp_phase = cos_k_dot_x * cos_phi - sin_k_dot_x * sin_phi;
+    ModelScalar imag_comp_phase = cos_k_dot_x * sin_phi + sin_k_dot_x * cos_phi;

-
-    ModelVector force = (ModelVector){ ff_re.x*real_comp_phase - ff_im.x*imag_comp_phase,
-                             ff_re.y*real_comp_phase - ff_im.y*imag_comp_phase,
-                             ff_re.z*real_comp_phase - ff_im.z*imag_comp_phase};
+    ModelVector force = (ModelVector){ff_re.x * real_comp_phase - ff_im.x * imag_comp_phase,
+                                      ff_re.y * real_comp_phase - ff_im.y * imag_comp_phase,
+                                      ff_re.z * real_comp_phase - ff_im.z * imag_comp_phase};

    return force;
 }