Context Navigation

← Previous Change
Next Change →

shallow_water_ext.c

Timestamp:

Jun 2, 2009, 8:52:47 AM (15 years ago)

Author:

ole

Message:

Thought a bit more about the flux optimisation implemented in changeset:7105

The y-momentum limiter has been reinstated. Instead of dropping it, I implemented a cut-off for limiting the momentum as described in the manual (see the section about the flux limiter). For the simple profile, compute_fluxes now takes 2.964s (as opposed to 4.284s prior to changeset:7105) and the overall runtime of evolve is 9.797s (as opposed to 10.909s). For the okushiri example the timings are now 109.551s for compute_fluxes and 293.314s overall.

This amounts to a performance improvement of about 10% in overall runtime.

See also changeset:6703 for past timings

These timings were conducted on a 3.0GHz Intel Core-2 running Ubuntu Linux.

I had to update a few tests that used to compare to exact values that are now slightly different.

File:

: 1 edited

anuga_core/source/anuga/shallow_water/shallow_water_ext.c (modified) (14 diffs)

Legend:

: Unmodified
: Added
: Removed

anuga_core/source/anuga/shallow_water/shallow_water_ext.c

-                      r7105
+                      r7143
                       double *h,
                       double epsilon,
+                      double h0) {
+                      double h0,
+                      double limiting_threshold) {
   double u;
+  if (*h < epsilon) {
+    *h = 0.0;  // Could have been negative
+    u = 0.0;
+  if (*h < limiting_threshold) {
+    // Apply limiting of speeds according to the ANUGA manual
+    if (*h < epsilon) {
+      *h = 0.0;  // Could have been negative
+      u = 0.0;
+    } else {
+      u = *uh/(*h + h0/ *h);
+    }
+    // Adjust momentum to be consistent with speed
+    *uh = u * *h;
   } else {
+    u = *uh/(*h + h0/ *h);
+    // We are in deep water - no need for limiting
+    u = *uh/ *h;
+  }
-  // Adjust momentum to be consistent with speed
-  *uh = u * *h;
   return u;
 …
                            double z_left, double z_right,
                            double n1, double n2,
+                           double epsilon, double H0, double g,
+                           double epsilon,
+                           double h0,
+                           double limiting_threshold,
+                           double g,
                            double *edgeflux, double *max_speed)
+{
 …
   double w_left, h_left, uh_left, vh_left, u_left;
   double w_right, h_right, uh_right, vh_right, u_right;
-  //double v_left, v_right;
   double s_min, s_max, soundspeed_left, soundspeed_right;
   double denom, inverse_denominator, z;
 …
   static double q_left_rotated[3], q_right_rotated[3], flux_right[3], flux_left[3];
-  double h0 = H0*H0; // This ensures a good balance when h approaches H0.
-                     // But evidence suggests that h0 can be as little as
-                     // epsilon!
   // Copy conserved quantities to protect from modification
   q_left_rotated[0] = q_left[0];
 …
   h_left = w_left - z;
   uh_left = q_left_rotated[1];
+  u_left = _compute_speed(&uh_left, &h_left, epsilon, h0);
+  u_left = _compute_speed(&uh_left, &h_left,
+                          epsilon, h0, limiting_threshold);
   w_right = q_right_rotated[0];
   h_right = w_right - z;
   uh_right = q_right_rotated[1];
+  u_right = _compute_speed(&uh_right, &h_right, epsilon, h0);
+  u_right = _compute_speed(&uh_right, &h_right,
+                           epsilon, h0, limiting_threshold);
   // Momentum in y-direction
 …
   // Leaving this out, improves speed significantly (Ole 27/5/2009)
   // All validation tests pass, so do we really need it anymore?
+  //v_left = _compute_speed(&vh_left, &h_left, epsilon, h0);
+  //v_right = _compute_speed(&vh_right, &h_right, epsilon, h0);
+  _compute_speed(&vh_left, &h_left,
+                 epsilon, h0, limiting_threshold);
+  _compute_speed(&vh_right, &h_right,
+                 epsilon, h0, limiting_threshold);
   // Maximal and minimal wave speeds
 …
   denom = s_max - s_min;
   if (denom < epsilon)
   { // FIXME (Ole): Try using H0 here
+  { // FIXME (Ole): Try using h0 here
     memset(edgeflux, 0, 3*sizeof(double));
     *max_speed = 0.0;
 …
   double h0 = H0*H0; //This ensures a good balance when h approaches H0.
+  double limiting_threshold = 10*H0; // Avoid applying limiter below this
   //Copy conserved quantities to protect from modification
   for (i=0; i<3; i++) {
 …
   h_left = w_left-z;
   uh_left = q_left_rotated[1];
+  u_left =_compute_speed(&uh_left, &h_left, epsilon, h0);
+  u_left =_compute_speed(&uh_left, &h_left,
+                         epsilon, h0, limiting_threshold);
   w_right = q_right_rotated[0];
   h_right = w_right-z;
   uh_right = q_right_rotated[1];
+  u_right =_compute_speed(&uh_right, &h_right, epsilon, h0);
+  u_right =_compute_speed(&uh_right, &h_right,
+                          epsilon, h0, limiting_threshold);
 …
   PyArrayObject *normal, *ql, *qr,  *edgeflux;
   double g, epsilon, max_speed, H0, zl, zr;
+  double h0, limiting_threshold;
   if (!PyArg_ParseTuple(args, "OOOddOddd",
 …
+  h0 = H0*H0; // This ensures a good balance when h approaches H0.
+              // But evidence suggests that h0 can be as little as
+              // epsilon!
+  limiting_threshold = 10*H0; // Avoid applying limiter below this
+                              // threshold for performance reasons.
+                              // See ANUGA manual under flux limiting
   _flux_function_central((double*) ql -> data,
+             (double*) qr -> data,
+             zl,
+             zr,
+             ((double*) normal -> data)[0],
+             ((double*) normal -> data)[1],
+             epsilon, H0, g,
+             (double*) edgeflux -> data,
+             &max_speed);
+                         (double*) qr -> data,
+                         zl,
+                         zr,
+                         ((double*) normal -> data)[0],
+                         ((double*) normal -> data)[1],
+                         epsilon, h0, limiting_threshold,
+                         g,
+                         (double*) edgeflux -> data,
+                         &max_speed);
   return Py_BuildValue("d", max_speed);
 …
   // Local variables
   double max_speed, length, inv_area, zl, zr;
+  double h0 = H0*H0; // This ensures a good balance when h approaches H0.
+  double limiting_threshold = 10*H0; // Avoid applying limiter below this
+                                     // threshold for performance reasons.
+                                     // See ANUGA manual under flux limiting
   int k, i, m, n;
   int ki, nm=0, ki2; // Index shorthands
   // Workspace (making them static actually made function slightly slower (Ole))
 …
   static long call = 1; // Static local variable flagging already computed flux
   // Start computation
   call++; // Flag 'id' of flux calculation for this timestep
 …
       _flux_function_central(ql, qr, zl, zr,
                              normals[ki2], normals[ki2+1],
                              epsilon, H0, g,
+                             epsilon, h0, limiting_threshold, g,
                              edgeflux, &max_speed);

Note: See TracChangeset for help on using the changeset viewer.

Context Navigation

Changeset 7143 for anuga_core/source/anuga/shallow_water/shallow_water_ext.c

Legend:

anuga_core/source/anuga/shallow_water/shallow_water_ext.c

Download in other formats: