# CUDA_PROFILE_LOG_VERSION 2.0 # CUDA_DEVICE 0 GeForce GTX 480 # CUDA_CONTEXT 1 # TIMESTAMPFACTOR fffff685dfc5b298 method,gputime,cputime,occupancy method=[ memcpyHtoDasync ] gputime=[ 0.992 ] cputime=[ 25.000 ] method=[ memcpyHtoDasync ] gputime=[ 0.800 ] cputime=[ 8.000 ] method=[ memcpyHtoDasync ] gputime=[ 0.768 ] cputime=[ 11.000 ] method=[ memcpyHtoDasync ] gputime=[ 1.440 ] cputime=[ 11.000 ] method=[ memcpyHtoDasync ] gputime=[ 1.440 ] cputime=[ 13.000 ] method=[ memcpyHtoDasync ] gputime=[ 1.472 ] cputime=[ 10.000 ] method=[ memcpyHtoDasync ] gputime=[ 58.528 ] cputime=[ 158.000 ] method=[ memcpyHtoDasync ] gputime=[ 236.000 ] cputime=[ 561.000 ] method=[ memcpyHtoDasync ] gputime=[ 219.424 ] cputime=[ 447.000 ] method=[ memcpyHtoDasync ] gputime=[ 219.552 ] cputime=[ 413.000 ] method=[ memcpyHtoDasync ] gputime=[ 617.152 ] cputime=[ 815.000 ] method=[ memcpyHtoDasync ] gputime=[ 203.968 ] cputime=[ 374.000 ] method=[ memcpyHtoDasync ] gputime=[ 69.376 ] cputime=[ 172.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.976 ] cputime=[ 124.000 ] method=[ memcpyHtoDasync ] gputime=[ 70.112 ] cputime=[ 120.000 ] method=[ memcpyHtoDasync ] gputime=[ 62.912 ] cputime=[ 118.000 ] method=[ memcpyHtoDasync ] gputime=[ 3.296 ] cputime=[ 14.000 ] method=[ memcpyHtoDasync ] gputime=[ 0.800 ] cputime=[ 10.000 ] method=[ memcpyHtoDasync ] gputime=[ 556.288 ] cputime=[ 641.000 ] method=[ memcpyHtoDasync ] gputime=[ 565.664 ] cputime=[ 749.000 ] method=[ memcpyHtoDasync ] gputime=[ 132.608 ] cputime=[ 256.000 ] method=[ memcpyHtoDasync ] gputime=[ 65.216 ] cputime=[ 142.000 ] method=[ memcpyHtoDasync ] gputime=[ 198.400 ] cputime=[ 286.000 ] method=[ memcpyHtoDasync ] gputime=[ 197.888 ] cputime=[ 345.000 ] method=[ memcpyHtoDasync ] gputime=[ 198.496 ] cputime=[ 341.000 ] method=[ memcpyHtoDasync ] gputime=[ 198.720 ] cputime=[ 345.000 ] method=[ memcpyHtoDasync ] gputime=[ 199.872 ] cputime=[ 343.000 ] method=[ memcpyHtoDasync ] gputime=[ 196.480 ] cputime=[ 339.000 ] method=[ memcpyHtoDasync ] gputime=[ 182.016 ] cputime=[ 340.000 ] method=[ memcpyHtoDasync ] gputime=[ 3.424 ] cputime=[ 19.000 ] method=[ memcpyHtoDasync ] gputime=[ 2.944 ] cputime=[ 8.000 ] method=[ memcpyHtoDasync ] gputime=[ 2.016 ] cputime=[ 10.000 ] method=[ memcpyHtoDasync ] gputime=[ 2.944 ] cputime=[ 9.000 ] method=[ memcpyHtoDasync ] gputime=[ 3.104 ] cputime=[ 10.000 ] method=[ memcpyHtoDasync ] gputime=[ 3.360 ] cputime=[ 8.000 ] method=[ memcpyHtoDasync ] gputime=[ 2.016 ] cputime=[ 6.000 ] method=[ memcpyHtoDasync ] gputime=[ 73.408 ] cputime=[ 92.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.528 ] cputime=[ 143.000 ] method=[ memcpyHtoDasync ] gputime=[ 65.856 ] cputime=[ 117.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.880 ] cputime=[ 115.000 ] method=[ memcpyHtoDasync ] gputime=[ 76.576 ] cputime=[ 122.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.976 ] cputime=[ 125.000 ] method=[ memcpyHtoDasync ] gputime=[ 180.352 ] cputime=[ 285.000 ] method=[ memcpyHtoDasync ] gputime=[ 197.920 ] cputime=[ 430.000 ] method=[ memcpyHtoDasync ] gputime=[ 198.048 ] cputime=[ 338.000 ] method=[ memcpyHtoDasync ] gputime=[ 196.640 ] cputime=[ 343.000 ] method=[ memcpyHtoDasync ] gputime=[ 68.704 ] cputime=[ 164.000 ] method=[ memcpyHtoDasync ] gputime=[ 67.392 ] cputime=[ 121.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.304 ] cputime=[ 113.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.624 ] cputime=[ 116.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.272 ] cputime=[ 116.000 ] method=[ memcpyHtoDasync ] gputime=[ 68.096 ] cputime=[ 114.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.272 ] cputime=[ 116.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.656 ] cputime=[ 114.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.688 ] cputime=[ 113.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.080 ] cputime=[ 114.000 ] method=[ memcpyHtoDasync ] gputime=[ 65.952 ] cputime=[ 112.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.240 ] cputime=[ 114.000 ] method=[ memcpyHtoDasync ] gputime=[ 75.168 ] cputime=[ 113.000 ] method=[ memcpyHtoDasync ] gputime=[ 65.344 ] cputime=[ 169.000 ] method=[ memcpyHtoDasync ] gputime=[ 224.096 ] cputime=[ 295.000 ] method=[ memcpyHtoDasync ] gputime=[ 63.616 ] cputime=[ 205.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.336 ] cputime=[ 78.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.080 ] cputime=[ 115.000 ] method=[ memcpyHtoDasync ] gputime=[ 194.144 ] cputime=[ 288.000 ] method=[ memcpyHtoDasync ] gputime=[ 65.216 ] cputime=[ 162.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.112 ] cputime=[ 88.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.400 ] cputime=[ 116.000 ] method=[ memcpyHtoDasync ] gputime=[ 195.040 ] cputime=[ 287.000 ] method=[ memcpyHtoDasync ] gputime=[ 65.568 ] cputime=[ 162.000 ] method=[ memcpyHtoDasync ] gputime=[ 66.080 ] cputime=[ 87.000 ] method=[ memcpyHtoDasync ] gputime=[ 57.696 ] cputime=[ 117.000 ] method=[ _protect_sw ] gputime=[ 9.120 ] cputime=[ 19.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 22.784 ] cputime=[ 6.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 201.600 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 25.056 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.992 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 21.952 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 209.792 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.896 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 8.160 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.432 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 455.776 ] cputime=[ 12.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.888 ] cputime=[ 594.000 ] method=[ gravity_wb ] gputime=[ 122.080 ] cputime=[ 8.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 379.328 ] cputime=[ 1091.000 ] method=[ _manning_friction_flat ] gputime=[ 5.568 ] cputime=[ 12.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.976 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 17.248 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 17.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.352 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.376 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 374.880 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.672 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.176 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.296 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.928 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.080 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.040 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 758.000 ] method=[ gravity_wb ] gputime=[ 123.168 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.664 ] cputime=[ 836.000 ] method=[ _manning_friction_flat ] gputime=[ 5.920 ] cputime=[ 11.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.416 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.600 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 381.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.224 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.800 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.336 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.200 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.016 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 454.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 792.000 ] method=[ gravity_wb ] gputime=[ 122.688 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.088 ] cputime=[ 794.000 ] method=[ _manning_friction_flat ] gputime=[ 10.016 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.432 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.672 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.664 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 377.536 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.480 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.704 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.720 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.240 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 446.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 786.000 ] method=[ gravity_wb ] gputime=[ 123.360 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.472 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.536 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.688 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.440 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 374.848 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.192 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.824 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.704 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.912 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 31.488 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.568 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 445.664 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.728 ] cputime=[ 794.000 ] method=[ gravity_wb ] gputime=[ 123.648 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.312 ] cputime=[ 794.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.272 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.544 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.152 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 374.528 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.352 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.496 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.832 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.720 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.784 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 445.920 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 784.000 ] method=[ gravity_wb ] gputime=[ 122.976 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 379.232 ] cputime=[ 856.000 ] method=[ _manning_friction_flat ] gputime=[ 5.632 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.184 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.248 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.032 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.216 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 371.040 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.096 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.704 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.824 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 453.792 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 786.000 ] method=[ gravity_wb ] gputime=[ 123.552 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.184 ] cputime=[ 794.000 ] method=[ _manning_friction_flat ] gputime=[ 5.472 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.016 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.728 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.224 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.736 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 380.736 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.352 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.528 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.272 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.920 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 454.464 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 801.000 ] method=[ gravity_wb ] gputime=[ 123.712 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.632 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.472 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.112 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.384 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 20.448 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 370.720 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.480 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.824 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.024 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.040 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.336 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.200 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.376 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.696 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 448.576 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 782.000 ] method=[ gravity_wb ] gputime=[ 123.264 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.832 ] cputime=[ 794.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.144 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.064 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.024 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 370.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.128 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.336 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.896 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 789.000 ] method=[ gravity_wb ] gputime=[ 123.296 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.824 ] cputime=[ 790.000 ] method=[ _manning_friction_flat ] gputime=[ 5.920 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.216 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.352 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.928 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 368.832 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.608 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.216 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 441.920 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 775.000 ] method=[ gravity_wb ] gputime=[ 123.552 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 374.016 ] cputime=[ 848.000 ] method=[ _manning_friction_flat ] gputime=[ 6.016 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.208 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 7.968 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.960 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 362.752 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 23.808 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.880 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.464 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.920 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 776.000 ] method=[ gravity_wb ] gputime=[ 123.680 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.952 ] cputime=[ 802.000 ] method=[ _manning_friction_flat ] gputime=[ 5.504 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.336 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.952 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.920 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.320 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.568 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 363.328 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.352 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.800 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.040 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.176 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.112 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 453.728 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 779.000 ] method=[ gravity_wb ] gputime=[ 123.136 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.928 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.728 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.064 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.864 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 360.384 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.928 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.720 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.592 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.072 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 29.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 453.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.312 ] cputime=[ 750.000 ] method=[ gravity_wb ] gputime=[ 124.288 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.824 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.568 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.784 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.176 ] cputime=[ 8.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.632 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.216 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 366.464 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.000 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.104 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.176 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.152 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.072 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 807.000 ] method=[ gravity_wb ] gputime=[ 123.040 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 422.208 ] cputime=[ 831.000 ] method=[ _manning_friction_flat ] gputime=[ 5.760 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.760 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.248 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.224 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.928 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 361.824 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 23.840 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.240 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.208 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.248 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 454.688 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 781.000 ] method=[ gravity_wb ] gputime=[ 123.840 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 370.304 ] cputime=[ 827.000 ] method=[ _manning_friction_flat ] gputime=[ 5.696 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 25.888 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.792 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.216 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.064 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.248 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 360.672 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.256 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.016 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.912 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.144 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.200 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.584 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 775.000 ] method=[ gravity_wb ] gputime=[ 123.648 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.120 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.440 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.592 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.568 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.664 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 366.848 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.352 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.112 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.464 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 448.224 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 779.000 ] method=[ gravity_wb ] gputime=[ 124.000 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.984 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.824 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.896 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 362.720 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.544 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.832 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.720 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.496 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 2.944 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 453.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 62.176 ] cputime=[ 781.000 ] method=[ gravity_wb ] gputime=[ 124.352 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 375.328 ] cputime=[ 841.000 ] method=[ _manning_friction_flat ] gputime=[ 5.760 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.432 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.000 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.504 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 366.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.192 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.720 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.080 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 768.000 ] method=[ gravity_wb ] gputime=[ 124.608 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 370.272 ] cputime=[ 832.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.848 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 6.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.736 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.568 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 357.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.576 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.728 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.824 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.120 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 773.000 ] method=[ gravity_wb ] gputime=[ 124.448 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.056 ] cputime=[ 797.000 ] method=[ _manning_friction_flat ] gputime=[ 5.408 ] cputime=[ 11.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.208 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.696 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 359.648 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.160 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.304 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.608 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.944 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.368 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.952 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.768 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 774.000 ] method=[ gravity_wb ] gputime=[ 123.872 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.440 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.440 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.688 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.792 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.888 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.248 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 361.536 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.192 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.720 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.016 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.408 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 454.176 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 775.000 ] method=[ gravity_wb ] gputime=[ 123.392 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.312 ] cputime=[ 796.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.432 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.608 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.120 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 357.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 23.872 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.824 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.672 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.624 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.312 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.016 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.960 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 778.000 ] method=[ gravity_wb ] gputime=[ 124.064 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.504 ] cputime=[ 790.000 ] method=[ _manning_friction_flat ] gputime=[ 5.856 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.560 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.856 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.280 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 362.816 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.544 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.944 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.624 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.992 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.088 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 454.528 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 782.000 ] method=[ gravity_wb ] gputime=[ 123.712 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 374.464 ] cputime=[ 859.000 ] method=[ _manning_friction_flat ] gputime=[ 5.760 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.952 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.760 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.728 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.760 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.792 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.448 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.824 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 355.424 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.128 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.040 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.624 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.952 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.408 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 441.888 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.600 ] cputime=[ 762.000 ] method=[ gravity_wb ] gputime=[ 124.160 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.728 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.792 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.496 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.480 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.056 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 356.448 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.640 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.912 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.272 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.088 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.144 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 448.064 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 766.000 ] method=[ gravity_wb ] gputime=[ 123.840 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.440 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 5.376 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.248 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 358.944 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.128 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.208 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.496 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 18.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.016 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.488 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 761.000 ] method=[ gravity_wb ] gputime=[ 123.168 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.600 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.632 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.848 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.920 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.120 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 357.984 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.608 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.720 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.992 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 442.624 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 790.000 ] method=[ gravity_wb ] gputime=[ 123.872 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 435.264 ] cputime=[ 853.000 ] method=[ _manning_friction_flat ] gputime=[ 5.504 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.144 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.112 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.352 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.536 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 355.392 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.480 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.984 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.912 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.992 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.328 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.536 ] cputime=[ 770.000 ] method=[ gravity_wb ] gputime=[ 123.200 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.568 ] cputime=[ 826.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.216 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.824 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.864 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 358.048 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 25.376 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.720 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.200 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.016 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 444.672 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 767.000 ] method=[ gravity_wb ] gputime=[ 123.584 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.248 ] cputime=[ 796.000 ] method=[ _manning_friction_flat ] gputime=[ 5.760 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.632 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 7.968 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.768 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 357.728 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.320 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.760 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.560 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.952 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 450.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 773.000 ] method=[ gravity_wb ] gputime=[ 123.904 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.952 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.432 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.376 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 357.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.320 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.992 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.336 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.152 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.016 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 30.048 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.160 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.664 ] cputime=[ 791.000 ] method=[ gravity_wb ] gputime=[ 124.352 ] cputime=[ 8.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.832 ] cputime=[ 794.000 ] method=[ _manning_friction_flat ] gputime=[ 5.568 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.024 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.248 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 352.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.192 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.720 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.208 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.952 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 455.424 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 772.000 ] method=[ gravity_wb ] gputime=[ 124.416 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 374.976 ] cputime=[ 845.000 ] method=[ _manning_friction_flat ] gputime=[ 5.568 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.720 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.376 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 349.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.544 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.944 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.432 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.296 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.984 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.904 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 765.000 ] method=[ gravity_wb ] gputime=[ 123.264 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.184 ] cputime=[ 796.000 ] method=[ _manning_friction_flat ] gputime=[ 5.728 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.336 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.704 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 356.224 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.544 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.592 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.400 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.048 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 446.272 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 767.000 ] method=[ gravity_wb ] gputime=[ 123.616 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.600 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.728 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.320 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.824 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 352.832 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.672 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.408 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.496 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 445.056 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 732.000 ] method=[ gravity_wb ] gputime=[ 124.320 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.408 ] cputime=[ 797.000 ] method=[ _manning_friction_flat ] gputime=[ 5.408 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.056 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 359.488 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.416 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.856 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 11.008 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.992 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 445.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 770.000 ] method=[ gravity_wb ] gputime=[ 123.904 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.920 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.472 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.280 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 353.664 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.512 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.144 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 450.816 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 768.000 ] method=[ gravity_wb ] gputime=[ 123.872 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.024 ] cputime=[ 808.000 ] method=[ _manning_friction_flat ] gputime=[ 5.536 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.944 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.728 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.384 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 18.112 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 359.424 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.160 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.984 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.976 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.528 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.200 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.896 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.696 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.824 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.864 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 777.000 ] method=[ gravity_wb ] gputime=[ 124.032 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.504 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.048 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.376 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 358.336 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.288 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.368 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 455.488 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 778.000 ] method=[ gravity_wb ] gputime=[ 124.576 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.792 ] cputime=[ 797.000 ] method=[ _manning_friction_flat ] gputime=[ 6.048 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.176 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.920 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.824 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.288 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.120 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 352.960 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.352 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.208 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.800 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 453.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 770.000 ] method=[ gravity_wb ] gputime=[ 124.032 ] cputime=[ 8.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.664 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.632 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.856 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 26.016 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.376 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 351.072 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.480 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.592 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.112 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.216 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 442.592 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 760.000 ] method=[ gravity_wb ] gputime=[ 123.776 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.280 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 5.696 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.112 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.696 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.472 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 352.064 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 25.184 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.944 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.992 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.984 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 455.232 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 772.000 ] method=[ gravity_wb ] gputime=[ 123.680 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.600 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.656 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.760 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 349.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.352 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.560 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.920 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.416 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 765.000 ] method=[ gravity_wb ] gputime=[ 124.352 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.120 ] cputime=[ 796.000 ] method=[ _manning_friction_flat ] gputime=[ 5.824 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.728 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.792 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 360.320 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.416 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.024 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 448.128 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 763.000 ] method=[ gravity_wb ] gputime=[ 123.072 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.728 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.696 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.672 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.984 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 356.800 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.416 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.952 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.880 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.592 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.248 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.144 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 457.984 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 779.000 ] method=[ gravity_wb ] gputime=[ 124.256 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.216 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.888 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.088 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 357.440 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.032 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.400 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 2.912 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 455.072 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 776.000 ] method=[ gravity_wb ] gputime=[ 124.608 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 370.048 ] cputime=[ 821.000 ] method=[ _manning_friction_flat ] gputime=[ 5.632 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 25.952 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.728 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.224 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.344 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 351.328 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.544 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.992 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.336 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.312 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 445.440 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 760.000 ] method=[ gravity_wb ] gputime=[ 124.960 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.344 ] cputime=[ 797.000 ] method=[ _manning_friction_flat ] gputime=[ 5.632 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.720 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.824 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 348.896 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.160 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.672 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.136 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.240 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.152 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.824 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 453.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 764.000 ] method=[ gravity_wb ] gputime=[ 124.576 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.824 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 25.984 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.032 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.184 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 352.768 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.608 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.208 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.048 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.104 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.208 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.072 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.928 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 772.000 ] method=[ gravity_wb ] gputime=[ 123.840 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 377.024 ] cputime=[ 840.000 ] method=[ _manning_friction_flat ] gputime=[ 5.376 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.336 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.408 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 358.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.992 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.504 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.312 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.912 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.496 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.744 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 767.000 ] method=[ gravity_wb ] gputime=[ 124.864 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.696 ] cputime=[ 802.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 11.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.184 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.088 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.056 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 352.992 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.096 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.208 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.176 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 438.976 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 753.000 ] method=[ gravity_wb ] gputime=[ 124.032 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.960 ] cputime=[ 796.000 ] method=[ _manning_friction_flat ] gputime=[ 5.696 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.432 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.672 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.960 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 354.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.512 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.072 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.528 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.072 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.056 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 450.080 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 768.000 ] method=[ gravity_wb ] gputime=[ 123.776 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.952 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.240 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.224 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.312 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 346.272 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.480 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.824 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.024 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.592 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.832 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 751.000 ] method=[ gravity_wb ] gputime=[ 124.256 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.960 ] cputime=[ 796.000 ] method=[ _manning_friction_flat ] gputime=[ 5.856 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.624 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.352 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 18.016 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 349.536 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.000 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.208 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.024 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.408 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 446.560 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.536 ] cputime=[ 760.000 ] method=[ gravity_wb ] gputime=[ 124.768 ] cputime=[ 8.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.984 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.568 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.784 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.760 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.296 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 25.120 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.592 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.072 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.992 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.952 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.104 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 760.000 ] method=[ gravity_wb ] gputime=[ 124.192 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.992 ] cputime=[ 804.000 ] method=[ _manning_friction_flat ] gputime=[ 5.888 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.400 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.760 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.224 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.504 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 354.656 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.704 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.640 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.240 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.952 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.384 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 769.000 ] method=[ gravity_wb ] gputime=[ 124.320 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.984 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.408 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.920 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.352 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.928 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 352.992 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.864 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.624 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.336 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.200 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.280 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 448.032 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 763.000 ] method=[ gravity_wb ] gputime=[ 125.376 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.504 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.112 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.792 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.224 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.056 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 348.960 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.928 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.992 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.136 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.624 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.864 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 457.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 772.000 ] method=[ gravity_wb ] gputime=[ 124.544 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.888 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 5.536 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.528 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.064 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.216 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 353.056 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.192 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.824 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.688 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.008 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.984 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.248 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 767.000 ] method=[ gravity_wb ] gputime=[ 124.928 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.248 ] cputime=[ 803.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.208 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.120 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 344.736 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.672 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.072 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.304 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 457.024 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 765.000 ] method=[ gravity_wb ] gputime=[ 125.600 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.472 ] cputime=[ 802.000 ] method=[ _manning_friction_flat ] gputime=[ 5.568 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.720 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.888 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.928 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 350.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.480 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.976 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.272 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.216 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 454.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.632 ] cputime=[ 768.000 ] method=[ gravity_wb ] gputime=[ 124.832 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.504 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.376 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.784 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.952 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.480 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.696 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 354.944 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.768 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.736 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.304 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 453.120 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.312 ] cputime=[ 749.000 ] method=[ gravity_wb ] gputime=[ 125.152 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.728 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.952 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.208 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.248 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.888 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.224 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.992 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 354.816 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.608 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.016 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.880 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.624 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.896 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 445.632 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 786.000 ] method=[ gravity_wb ] gputime=[ 124.512 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 436.096 ] cputime=[ 846.000 ] method=[ _manning_friction_flat ] gputime=[ 5.344 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.144 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.824 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 345.984 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.640 ] cputime=[ 15.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.368 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 447.776 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 747.000 ] method=[ gravity_wb ] gputime=[ 124.000 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 370.016 ] cputime=[ 808.000 ] method=[ _manning_friction_flat ] gputime=[ 5.728 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.728 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.320 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.152 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 358.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.480 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.112 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.952 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.552 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 772.000 ] method=[ gravity_wb ] gputime=[ 123.328 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.344 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.824 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 23.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.160 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.440 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 351.968 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.416 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.792 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.944 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.368 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.440 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 458.272 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 774.000 ] method=[ gravity_wb ] gputime=[ 124.832 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.664 ] cputime=[ 802.000 ] method=[ _manning_friction_flat ] gputime=[ 5.504 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.496 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.600 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.160 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.568 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 346.720 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.768 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.832 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.944 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.272 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.088 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.048 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.424 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.536 ] cputime=[ 762.000 ] method=[ gravity_wb ] gputime=[ 123.872 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.440 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.536 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.560 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.160 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.184 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 356.064 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.576 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.088 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 768.000 ] method=[ gravity_wb ] gputime=[ 124.608 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.632 ] cputime=[ 808.000 ] method=[ _manning_friction_flat ] gputime=[ 5.376 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.112 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.832 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 352.064 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.416 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.896 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.976 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.304 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.056 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 459.808 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 774.000 ] method=[ gravity_wb ] gputime=[ 124.960 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.992 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 5.568 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.400 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.248 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.504 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 341.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.544 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.768 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.496 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.088 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.920 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 448.512 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 752.000 ] method=[ gravity_wb ] gputime=[ 124.576 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.696 ] cputime=[ 803.000 ] method=[ _manning_friction_flat ] gputime=[ 5.472 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.624 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.696 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.792 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 7.968 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.056 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.904 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.704 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.736 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.864 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.056 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.040 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.272 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.024 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.240 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.152 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 748.000 ] method=[ gravity_wb ] gputime=[ 123.744 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.888 ] cputime=[ 796.000 ] method=[ _manning_friction_flat ] gputime=[ 5.376 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.176 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.184 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.936 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.576 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.568 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.608 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.896 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.880 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.720 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.296 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.216 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.952 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 445.312 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 764.000 ] method=[ gravity_wb ] gputime=[ 123.712 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.376 ] cputime=[ 797.000 ] method=[ _manning_friction_flat ] gputime=[ 5.536 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.528 ] cputime=[ 6.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.216 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.800 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.728 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 357.216 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.288 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.336 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.920 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 454.560 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 775.000 ] method=[ gravity_wb ] gputime=[ 124.960 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.056 ] cputime=[ 816.000 ] method=[ _manning_friction_flat ] gputime=[ 5.792 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.624 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.032 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.056 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.168 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.544 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.952 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.720 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.624 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.120 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 453.248 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 764.000 ] method=[ gravity_wb ] gputime=[ 124.608 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.792 ] cputime=[ 803.000 ] method=[ _manning_friction_flat ] gputime=[ 6.048 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.464 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.224 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.504 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 349.088 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.576 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.056 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.896 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.624 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.248 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.888 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.120 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 758.000 ] method=[ gravity_wb ] gputime=[ 124.768 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.472 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.728 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.528 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.120 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.904 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.576 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.824 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.912 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.368 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 447.296 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.312 ] cputime=[ 760.000 ] method=[ gravity_wb ] gputime=[ 124.736 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.568 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.440 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.336 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.888 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.224 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.312 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 339.424 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.768 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.824 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.848 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.240 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 457.664 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 762.000 ] method=[ gravity_wb ] gputime=[ 125.056 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.928 ] cputime=[ 809.000 ] method=[ _manning_friction_flat ] gputime=[ 5.824 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.176 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.184 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.352 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.216 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 344.544 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.544 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.992 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.200 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.864 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.048 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.920 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 453.984 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 761.000 ] method=[ gravity_wb ] gputime=[ 124.192 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.920 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.536 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.144 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.856 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.032 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.896 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 342.048 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.672 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.992 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.432 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.280 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 446.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 751.000 ] method=[ gravity_wb ] gputime=[ 124.512 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 370.112 ] cputime=[ 794.000 ] method=[ _manning_friction_flat ] gputime=[ 5.984 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.560 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.312 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 349.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.640 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.296 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.992 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.984 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.824 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 448.096 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 751.000 ] method=[ gravity_wb ] gputime=[ 124.800 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.472 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.536 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.240 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.320 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.344 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 345.792 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.416 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.240 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.800 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.688 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.896 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.856 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 759.000 ] method=[ gravity_wb ] gputime=[ 124.160 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.960 ] cputime=[ 788.000 ] method=[ _manning_friction_flat ] gputime=[ 5.760 ] cputime=[ 11.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.144 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.728 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.064 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.992 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 345.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 23.968 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.072 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.560 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 450.208 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 752.000 ] method=[ gravity_wb ] gputime=[ 125.088 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.728 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.536 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.528 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.064 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.568 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 346.752 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 25.024 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.112 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.008 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.632 ] cputime=[ 760.000 ] method=[ gravity_wb ] gputime=[ 124.288 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.632 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 5.440 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.528 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.064 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.248 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 339.680 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.896 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.264 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.832 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.120 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.888 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 446.528 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 738.000 ] method=[ gravity_wb ] gputime=[ 123.840 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.920 ] cputime=[ 802.000 ] method=[ _manning_friction_flat ] gputime=[ 5.792 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.920 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.344 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 353.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.064 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.184 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.168 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.976 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.344 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 455.648 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.504 ] cputime=[ 773.000 ] method=[ gravity_wb ] gputime=[ 125.280 ] cputime=[ 8.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.728 ] cputime=[ 794.000 ] method=[ _manning_friction_flat ] gputime=[ 5.824 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.336 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.064 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.152 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 346.688 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.480 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.888 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 9.952 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.864 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.696 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 763.000 ] method=[ gravity_wb ] gputime=[ 124.448 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.920 ] cputime=[ 810.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.272 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.160 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.536 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 341.632 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.864 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.024 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.400 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.696 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 455.488 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 760.000 ] method=[ gravity_wb ] gputime=[ 124.640 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.864 ] cputime=[ 797.000 ] method=[ _manning_friction_flat ] gputime=[ 5.504 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.560 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.736 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.792 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 343.104 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.672 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.048 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.624 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.920 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 445.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 754.000 ] method=[ gravity_wb ] gputime=[ 124.384 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 370.016 ] cputime=[ 802.000 ] method=[ _manning_friction_flat ] gputime=[ 5.440 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.216 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.472 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 337.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.384 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.864 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.240 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 445.248 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 746.000 ] method=[ gravity_wb ] gputime=[ 124.576 ] cputime=[ 8.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.088 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.696 ] cputime=[ 11.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.560 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.728 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.160 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.768 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 344.768 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 25.536 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.080 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.912 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.984 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 28.800 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.544 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 763.000 ] method=[ gravity_wb ] gputime=[ 124.192 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.536 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.528 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.512 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.632 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 343.296 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.416 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.984 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.912 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.864 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 448.864 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 756.000 ] method=[ gravity_wb ] gputime=[ 124.032 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.088 ] cputime=[ 796.000 ] method=[ _manning_friction_flat ] gputime=[ 5.728 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.048 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.184 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 350.720 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.512 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.728 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.800 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.104 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.624 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.232 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.920 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.408 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 454.784 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 769.000 ] method=[ gravity_wb ] gputime=[ 124.992 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.888 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.728 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.960 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 350.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.224 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.880 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 450.272 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 741.000 ] method=[ gravity_wb ] gputime=[ 124.352 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.728 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 5.376 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.088 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 354.528 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 23.936 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.720 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.952 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.416 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 772.000 ] method=[ gravity_wb ] gputime=[ 124.576 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.632 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.856 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.528 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.888 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.224 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.928 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 348.928 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.736 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.568 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.912 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.200 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.992 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 442.208 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 756.000 ] method=[ gravity_wb ] gputime=[ 124.672 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.408 ] cputime=[ 807.000 ] method=[ _manning_friction_flat ] gputime=[ 5.632 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.208 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 26.048 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.312 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 343.392 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 23.872 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.728 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.104 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.496 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.088 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.952 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 757.000 ] method=[ gravity_wb ] gputime=[ 124.384 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.760 ] cputime=[ 802.000 ] method=[ _manning_friction_flat ] gputime=[ 5.376 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.112 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.320 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.928 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.040 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.320 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.944 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.112 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.640 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 762.000 ] method=[ gravity_wb ] gputime=[ 124.768 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.056 ] cputime=[ 797.000 ] method=[ _manning_friction_flat ] gputime=[ 5.760 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.272 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.792 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.728 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.352 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.088 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 340.864 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.384 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.056 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.016 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.176 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.648 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 758.000 ] method=[ gravity_wb ] gputime=[ 125.184 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.760 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.504 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.112 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.728 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.480 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.664 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.712 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.544 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.888 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.944 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.112 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 446.016 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 757.000 ] method=[ gravity_wb ] gputime=[ 123.872 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.864 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.536 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.112 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.288 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.440 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 349.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.448 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.928 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.080 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.208 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 14.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 445.024 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 746.000 ] method=[ gravity_wb ] gputime=[ 124.800 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.472 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.432 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.664 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.032 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.184 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 342.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.608 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.944 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.656 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.200 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.208 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.760 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 454.144 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 760.000 ] method=[ gravity_wb ] gputime=[ 125.024 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.440 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 5.440 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.528 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.064 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.280 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 346.816 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.832 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.168 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.464 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 751.000 ] method=[ gravity_wb ] gputime=[ 124.896 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.536 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.760 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.352 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.568 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.200 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 25.312 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.312 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.528 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.824 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 455.936 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 765.000 ] method=[ gravity_wb ] gputime=[ 124.128 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.704 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.472 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.448 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.056 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 349.472 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.192 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.824 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.040 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.240 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.504 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 763.000 ] method=[ gravity_wb ] gputime=[ 125.440 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.664 ] cputime=[ 822.000 ] method=[ _manning_friction_flat ] gputime=[ 5.408 ] cputime=[ 11.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.064 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.632 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 349.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.544 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.016 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.560 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.200 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.768 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 760.000 ] method=[ gravity_wb ] gputime=[ 124.192 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.024 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.856 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.160 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.600 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 354.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.000 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.640 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.688 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.688 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.248 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.240 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.872 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 767.000 ] method=[ gravity_wb ] gputime=[ 124.416 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.728 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.632 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.560 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.760 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.000 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.504 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 339.776 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.256 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.080 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.528 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 448.128 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 751.000 ] method=[ gravity_wb ] gputime=[ 124.864 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.960 ] cputime=[ 796.000 ] method=[ _manning_friction_flat ] gputime=[ 5.792 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.056 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 342.720 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 25.056 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.048 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.944 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.752 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.952 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.536 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 758.000 ] method=[ gravity_wb ] gputime=[ 123.776 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.760 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 5.888 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.432 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.152 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.384 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.600 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 346.208 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.640 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.704 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.912 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.688 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.008 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.088 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.160 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 761.000 ] method=[ gravity_wb ] gputime=[ 125.472 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.248 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.472 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.272 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.216 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.184 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.328 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.736 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.408 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.464 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.792 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 445.984 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 757.000 ] method=[ gravity_wb ] gputime=[ 125.184 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.696 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.400 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.632 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.416 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.376 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 349.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.384 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.792 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.880 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.120 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.696 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 752.000 ] method=[ gravity_wb ] gputime=[ 124.736 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.960 ] cputime=[ 796.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.144 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.888 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.728 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.928 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 344.928 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.384 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.896 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.040 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.624 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.344 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.208 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 454.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 784.000 ] method=[ gravity_wb ] gputime=[ 124.384 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.312 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.344 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.464 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.240 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.160 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.056 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 346.848 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.384 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.048 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 458.624 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 769.000 ] method=[ gravity_wb ] gputime=[ 124.096 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.056 ] cputime=[ 804.000 ] method=[ _manning_friction_flat ] gputime=[ 5.632 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.688 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.384 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 18.112 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 346.592 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.448 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.824 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 448.032 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 754.000 ] method=[ gravity_wb ] gputime=[ 124.544 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.824 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 6.048 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 12.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.344 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.712 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.640 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.768 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.144 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.016 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.216 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.952 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 458.528 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.472 ] cputime=[ 770.000 ] method=[ gravity_wb ] gputime=[ 126.304 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.800 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 6.272 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.856 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.248 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.448 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.928 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 332.416 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.960 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.432 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.296 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.744 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 746.000 ] method=[ gravity_wb ] gputime=[ 124.960 ] cputime=[ 8.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 370.016 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.440 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 27.072 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.536 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 345.696 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.160 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.912 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.464 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.824 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 439.200 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 750.000 ] method=[ gravity_wb ] gputime=[ 124.672 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.312 ] cputime=[ 802.000 ] method=[ _manning_friction_flat ] gputime=[ 5.760 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.496 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.416 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.672 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 338.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.448 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.504 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.864 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.624 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 454.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 754.000 ] method=[ gravity_wb ] gputime=[ 124.096 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.856 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.824 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.016 ] cputime=[ 6.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.760 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.160 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.728 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 337.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.800 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.704 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.976 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.208 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.832 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.048 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 457.760 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 758.000 ] method=[ gravity_wb ] gputime=[ 125.664 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.024 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.440 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.560 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.320 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.888 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.008 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.288 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.144 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.496 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.216 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.272 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 445.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 738.000 ] method=[ gravity_wb ] gputime=[ 125.696 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.376 ] cputime=[ 803.000 ] method=[ _manning_friction_flat ] gputime=[ 5.504 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.432 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.160 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.960 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 344.320 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.480 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.880 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.528 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.024 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 450.528 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.600 ] cputime=[ 760.000 ] method=[ gravity_wb ] gputime=[ 124.480 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.344 ] cputime=[ 788.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.176 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.824 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.320 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.536 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.520 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.160 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.184 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.304 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.896 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.504 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.056 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.032 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 763.000 ] method=[ gravity_wb ] gputime=[ 125.280 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.824 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.696 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.224 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.960 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 345.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.896 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.992 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 446.112 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 755.000 ] method=[ gravity_wb ] gputime=[ 124.640 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.376 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.504 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.144 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.216 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.352 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 18.016 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 344.160 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.992 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.312 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.816 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.336 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.248 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 455.136 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 737.000 ] method=[ gravity_wb ] gputime=[ 124.000 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.632 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.856 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.216 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.376 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 346.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.928 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.760 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.944 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.992 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 455.136 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 767.000 ] method=[ gravity_wb ] gputime=[ 124.768 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.736 ] cputime=[ 794.000 ] method=[ _manning_friction_flat ] gputime=[ 5.632 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.792 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.888 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 346.496 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.224 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.072 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.528 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 450.144 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 758.000 ] method=[ gravity_wb ] gputime=[ 124.480 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.600 ] cputime=[ 808.000 ] method=[ _manning_friction_flat ] gputime=[ 5.408 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.288 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.152 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 346.720 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.544 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.016 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.832 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.688 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.144 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.864 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 446.944 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 755.000 ] method=[ gravity_wb ] gputime=[ 124.832 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.864 ] cputime=[ 797.000 ] method=[ _manning_friction_flat ] gputime=[ 5.568 ] cputime=[ 29.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.272 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.696 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.224 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.600 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 348.864 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.512 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.312 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.112 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.696 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.176 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.904 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 762.000 ] method=[ gravity_wb ] gputime=[ 124.288 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.792 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.976 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.208 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.576 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.152 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 344.384 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.576 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.704 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.944 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.464 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.824 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 452.928 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 758.000 ] method=[ gravity_wb ] gputime=[ 124.672 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.120 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.376 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.560 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.760 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.760 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.344 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 341.152 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.224 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.976 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.432 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.112 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 443.872 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 750.000 ] method=[ gravity_wb ] gputime=[ 124.960 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 370.112 ] cputime=[ 803.000 ] method=[ _manning_friction_flat ] gputime=[ 5.920 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.208 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 7.936 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.408 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 343.168 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.256 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.832 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.976 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.624 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.424 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 757.000 ] method=[ gravity_wb ] gputime=[ 124.800 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.672 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 5.440 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.056 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 342.464 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.288 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.728 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.896 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.688 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.400 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.024 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.376 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 753.000 ] method=[ gravity_wb ] gputime=[ 123.936 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.344 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.856 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.752 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.056 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.096 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.184 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 342.752 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.160 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.040 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.144 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.856 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 448.448 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 746.000 ] method=[ gravity_wb ] gputime=[ 125.024 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.896 ] cputime=[ 796.000 ] method=[ _manning_friction_flat ] gputime=[ 5.696 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.184 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 341.024 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.512 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.920 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 444.000 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 752.000 ] method=[ gravity_wb ] gputime=[ 124.288 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.760 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.568 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.216 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.000 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.312 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 348.512 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.512 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.824 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.528 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.024 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.888 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 450.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 763.000 ] method=[ gravity_wb ] gputime=[ 125.376 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.248 ] cputime=[ 816.000 ] method=[ _manning_friction_flat ] gputime=[ 5.664 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.720 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.248 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 340.416 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.480 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.048 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.720 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.432 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.984 ] cputime=[ 15.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 745.000 ] method=[ gravity_wb ] gputime=[ 124.672 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.504 ] cputime=[ 802.000 ] method=[ _manning_friction_flat ] gputime=[ 5.568 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.240 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.152 ] cputime=[ 14.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 342.496 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.704 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.544 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.848 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.208 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.264 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.864 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.440 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.040 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 754.000 ] method=[ gravity_wb ] gputime=[ 124.864 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.992 ] cputime=[ 796.000 ] method=[ _manning_friction_flat ] gputime=[ 5.504 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.464 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.280 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.064 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.152 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 335.552 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.672 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.952 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.992 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.832 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 463.232 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 764.000 ] method=[ gravity_wb ] gputime=[ 125.184 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.792 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.984 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.688 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.000 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.768 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 334.624 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.128 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.824 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.992 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.496 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.952 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 462.912 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 763.000 ] method=[ gravity_wb ] gputime=[ 125.056 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.024 ] cputime=[ 817.000 ] method=[ _manning_friction_flat ] gputime=[ 5.408 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.144 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.728 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.760 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 344.672 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.608 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.632 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.568 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.104 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.272 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.312 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.856 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 455.904 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 765.000 ] method=[ gravity_wb ] gputime=[ 124.992 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.824 ] cputime=[ 802.000 ] method=[ _manning_friction_flat ] gputime=[ 5.280 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.472 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 7.968 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.248 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 340.800 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.736 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.240 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.992 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.496 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.392 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.824 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 448.064 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 753.000 ] method=[ gravity_wb ] gputime=[ 125.504 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.472 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 6.240 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.144 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.640 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.992 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 342.560 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.512 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.056 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.504 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.040 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.048 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.392 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 758.000 ] method=[ gravity_wb ] gputime=[ 125.408 ] cputime=[ 7.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 370.304 ] cputime=[ 802.000 ] method=[ _manning_friction_flat ] gputime=[ 5.888 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.248 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.600 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.064 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.376 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 343.360 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.512 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.184 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.952 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.040 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.304 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 449.824 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 757.000 ] method=[ gravity_wb ] gputime=[ 124.160 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.736 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.528 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.376 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.192 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.504 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 342.944 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.416 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.672 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.736 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.400 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.792 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 28.992 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 451.872 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 758.000 ] method=[ gravity_wb ] gputime=[ 124.672 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.632 ] cputime=[ 800.000 ] method=[ _manning_friction_flat ] gputime=[ 5.536 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.688 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.208 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.160 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.728 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 343.968 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.800 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.080 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.168 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.896 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.568 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.472 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 455.872 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 763.000 ] method=[ gravity_wb ] gputime=[ 124.672 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.672 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.856 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.208 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.856 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.312 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 341.824 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.416 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.696 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.768 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.976 ] cputime=[ 17.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.272 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.200 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.216 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.824 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 453.408 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 743.000 ] method=[ gravity_wb ] gputime=[ 125.856 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 376.224 ] cputime=[ 850.000 ] method=[ _manning_friction_flat ] gputime=[ 5.888 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.272 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.664 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.408 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.128 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 16.704 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 339.712 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.704 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.792 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.912 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.304 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.072 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 20.960 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.536 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.472 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 457.088 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.376 ] cputime=[ 753.000 ] method=[ gravity_wb ] gputime=[ 123.680 ] cputime=[ 8.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.184 ] cputime=[ 795.000 ] method=[ _manning_friction_flat ] gputime=[ 5.600 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.568 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.160 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.152 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 341.344 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.736 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.280 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.376 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.784 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.560 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.088 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 30.112 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.632 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 444.128 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.344 ] cputime=[ 750.000 ] method=[ gravity_wb ] gputime=[ 125.184 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.984 ] cputime=[ 810.000 ] method=[ _manning_friction_flat ] gputime=[ 5.888 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.368 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.792 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.256 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.088 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 347.488 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.736 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.120 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.816 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.232 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.216 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.536 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 454.144 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 766.000 ] method=[ gravity_wb ] gputime=[ 124.704 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 368.928 ] cputime=[ 799.000 ] method=[ _manning_friction_flat ] gputime=[ 5.952 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.400 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.080 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.760 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.824 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.416 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.440 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 335.360 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.704 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.656 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.560 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.120 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.440 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.024 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.016 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 446.656 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.408 ] cputime=[ 748.000 ] method=[ gravity_wb ] gputime=[ 124.832 ] cputime=[ 6.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.344 ] cputime=[ 801.000 ] method=[ _manning_friction_flat ] gputime=[ 5.696 ] cputime=[ 9.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.344 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.728 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.696 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.512 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.632 ] cputime=[ 4.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 342.592 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 25.312 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.440 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.928 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 22.048 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 7.008 ] cputime=[ 5.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.528 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.136 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.024 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 5.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.408 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 5.984 ] cputime=[ 3.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.504 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ compute_fluxes_central_structure_CUDA ] gputime=[ 446.304 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memcpyDtoHasync ] gputime=[ 61.440 ] cputime=[ 760.000 ] method=[ gravity_wb ] gputime=[ 126.240 ] cputime=[ 8.000 ] occupancy=[ 0.167 ] method=[ memcpyDtoH ] gputime=[ 369.120 ] cputime=[ 798.000 ] method=[ _manning_friction_flat ] gputime=[ 5.728 ] cputime=[ 10.000 ] occupancy=[ 0.750 ] method=[ update ] gputime=[ 26.752 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.312 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.632 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ update ] gputime=[ 25.600 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 5.664 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ _protect_sw ] gputime=[ 8.032 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ extrapolate_velocity_second_order_true ] gputime=[ 17.056 ] cputime=[ 5.000 ] occupancy=[ 0.667 ] method=[ extrapolate_second_order_sw_true ] gputime=[ 345.376 ] cputime=[ 5.000 ] occupancy=[ 0.333 ] method=[ _balance_deep_and_shallow ] gputime=[ 24.480 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.760 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 20.896 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ _interpolate_from_vertices_to_edges ] gputime=[ 21.248 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ evaluate_segment_reflective ] gputime=[ 6.752 ] cputime=[ 4.000 ] occupancy=[ 0.042 ] method=[ evaluate_segment_reflective ] gputime=[ 10.400 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ set_boundary_values_from_edges ] gputime=[ 3.104 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ update_centroids_of_velocities_and_height ] gputime=[ 21.152 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ extrapolate_first_order ] gputime=[ 29.664 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.600 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ extrapolate_first_order ] gputime=[ 29.344 ] cputime=[ 4.000 ] occupancy=[ 0.167 ] method=[ memset32_post ] gputime=[ 6.048 ] cputime=[ 4.000 ] occupancy=[ 0.333 ] method=[ memset32_post ] gputime=[ 9.408 ] cputime=[ 3.000 ] occupancy=[ 0.333 ]