|-> 31.190 - 100.000% [1] {min=31.190, max=31.190, mean=31.190, var=0.000, std dev=0.000} APEX MAIN | |-> 6.305 - 20.214% [350] {min=0.001, max=0.033, mean=0.018, var=0.000, std dev=0.006} Kokkos::parallel_for [HPX] EvalEOSForElems A | | |-> 1.799 - 5.769% [350] {min=0.000, max=0.012, mean=0.005, var=0.000, std dev=0.003} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 255.309 - 818.550% [51160] {min=0.000, max=0.017, mean=0.005, var=0.000, std dev=0.002} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 4.505 - 14.445% | |-> 3.751 - 12.026% [350] {min=0.001, max=0.016, mean=0.011, var=0.000, std dev=0.004} Kokkos::parallel_for [HPX] CalcEnergyForElems | | |-> 1.251 - 4.012% [350] {min=0.000, max=0.010, mean=0.004, var=0.000, std dev=0.002} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 148.090 - 474.793% [51160] {min=0.000, max=0.011, mean=0.003, var=0.000, std dev=0.002} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 2.500 - 8.014% | |-> 3.306 - 10.598% [10] {min=0.316, max=0.345, mean=0.331, var=0.000, std dev=0.009} Kokkos::parallel_reduce [HPX] ZL28CalcHourglassControlForElemsR6DomainPddEUliRiE_ | | |-> 1.065 - 3.413% [10] {min=0.000, max=0.110, mean=0.106, var=0.000, std dev=0.003} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 134.592 - 431.520% [1270] {min=0.101, max=0.132, mean=0.106, var=0.000, std dev=0.004} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | |-> 0.002 - 0.008% [10] {min=0.000, max=0.000, mean=0.000, var=-0.000, std dev=-nan} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.001 - 0.004% [470] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | Remainder: 0.001 - 0.004% | | Remainder: 2.239 - 7.177% | |-> 2.648 - 8.491% [110] {min=0.001, max=2.113, mean=0.024, var=0.040, std dev=0.200} Kokkos::parallel_for [HPX] EvalEOSForElems F | | |-> 0.162 - 0.518% [110] {min=0.000, max=0.004, mean=0.001, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 19.627 - 62.926% [14470] {min=0.000, max=0.008, mean=0.001, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 2.487 - 7.972% | |-> 2.303 - 7.383% [110] {min=0.001, max=2.175, mean=0.021, var=0.043, std dev=0.206} Kokkos::parallel_reduce [HPX] ZL27CalcHydroConstraintForElemsR6DomainiidRdEUliR9MinFinderE_ | | |-> 0.090 - 0.288% [110] {min=0.000, max=0.001, mean=0.001, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.514 - 1.647% [14470] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | |-> 0.023 - 0.074% [110] {min=0.000, max=0.000, mean=0.000, var=-0.000, std dev=-nan} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.010 - 0.033% [5170] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | Remainder: 0.013 - 0.041% | | Remainder: 2.190 - 7.021% | |-> 1.912 - 6.130% [127] {min=0.000, max=0.059, mean=0.015, var=0.000, std dev=0.006} Kokkos::parallel_for [HPX] Kokkos::View::initialization [] via memset | |-> 1.380 - 4.424% [10] {min=0.120, max=0.145, mean=0.138, var=0.000, std dev=0.007} Kokkos::parallel_for [HPX] CalcFBHourglassForceForElems A | | |-> 0.381 - 1.222% [10] {min=0.000, max=0.087, mean=0.038, var=0.000, std dev=0.018} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Real_t, Index_t, Index_t)::, {Kokkos::Experimental::HPX}>:: >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Real_t, Index_t, Index_t)::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 46.987 - 150.647% [1270] {min=0.018, max=0.106, mean=0.037, var=0.000, std dev=0.017} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Real_t, Index_t, Index_t)::, {Kokkos::Experimental::HPX}>:: >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Real_t, Index_t, Index_t)::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.999 - 3.202% | |-> 1.353 - 4.337% [2] {min=0.339, max=1.013, mean=0.676, var=0.114, std dev=0.337} Kokkos::parallel_for [HPX] Kokkos::View::initialization [Buffer] via memset | |-> 1.217 - 3.901% [110] {min=0.001, max=0.024, mean=0.011, var=0.000, std dev=0.007} Kokkos::parallel_for [HPX] CalcMonotonicQRegionForElems | | |-> 0.326 - 1.046% [110] {min=0.000, max=0.011, mean=0.003, var=0.000, std dev=0.002} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 47.154 - 151.182% [14470] {min=0.000, max=0.017, mean=0.003, var=0.000, std dev=0.003} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.890 - 2.855% | |-> 0.798 - 2.559% [10] {min=0.077, max=0.085, mean=0.080, var=0.000, std dev=0.002} Kokkos::parallel_for [HPX] CalcFBHourglassForceForElems B | | |-> 0.095 - 0.303% [10] {min=0.000, max=0.016, mean=0.009, var=0.000, std dev=0.003} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Real_t, Index_t, Index_t)::, {}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 25.824 - 82.795% [1290] {min=0.004, max=0.052, mean=0.020, var=0.000, std dev=0.011} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Kokkos::View >, Real_t, Index_t, Index_t)::, {}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.703 - 2.255% | |-> 0.775 - 2.485% [10] {min=0.064, max=0.083, mean=0.078, var=0.000, std dev=0.005} Kokkos::parallel_for [HPX] IntegrateStressForElems B | | |-> 0.082 - 0.264% [10] {min=0.000, max=0.016, mean=0.008, var=0.000, std dev=0.004} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 25.556 - 81.936% [1290] {min=0.004, max=0.052, mean=0.020, var=0.000, std dev=0.011} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.693 - 2.221% | |-> 0.727 - 2.330% [10] {min=0.063, max=0.083, mean=0.073, var=0.000, std dev=0.006} Kokkos::parallel_for [HPX] IntegrateStressForElems A | | |-> 0.214 - 0.687% [10] {min=0.000, max=0.028, mean=0.021, var=0.000, std dev=0.002} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 26.799 - 85.919% [1270] {min=0.016, max=0.047, mean=0.021, var=0.000, std dev=0.004} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.512 - 1.643% | |-> 0.511 - 1.640% [10] {min=0.046, max=0.061, mean=0.051, var=0.000, std dev=0.005} Kokkos::parallel_for [HPX] CalcKinematicsForElems | | |-> 0.198 - 0.636% [10] {min=0.000, max=0.038, mean=0.020, var=0.000, std dev=0.007} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 20.002 - 64.130% [1270] {min=0.013, max=0.031, mean=0.016, var=0.000, std dev=0.002} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.313 - 1.003% | |-> 0.392 - 1.258% [10] {min=0.030, max=0.050, mean=0.039, var=0.000, std dev=0.006} Kokkos::parallel_for [HPX] CalcMonotonicQGradientsForElems | | |-> 0.162 - 0.519% [10] {min=0.000, max=0.023, mean=0.016, var=0.000, std dev=0.004} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 15.193 - 48.709% [1270] {min=0.009, max=0.031, mean=0.012, var=0.000, std dev=0.003} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.231 - 0.739% | |-> 0.359 - 1.152% [110] {min=0.001, max=0.034, mean=0.003, var=0.000, std dev=0.003} Kokkos::parallel_for [HPX] CalcSoundSpeedForElems | | |-> 0.145 - 0.466% [110] {min=0.000, max=0.003, mean=0.001, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 10.355 - 33.199% [14470] {min=0.000, max=0.004, mean=0.001, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.214 - 0.686% | |-> 0.202 - 0.647% [10] {min=0.019, max=0.024, mean=0.020, var=0.000, std dev=0.001} Kokkos::parallel_for [HPX] Kokkos::View::initialization [vnewc] via memset | |-> 0.170 - 0.545% [110] {min=0.001, max=0.005, mean=0.002, var=0.000, std dev=0.001} Kokkos::parallel_reduce [HPX] ZL29CalcCourantConstraintForElemsR6DomainiidRdEUliR9MinFinderE_ | | |-> 0.114 - 0.367% [110] {min=0.000, max=0.004, mean=0.001, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 1.920 - 6.155% [14470] {min=0.000, max=0.004, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | |-> 0.024 - 0.076% [110] {min=0.000, max=0.000, mean=0.000, var=-0.000, std dev=-nan} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.011 - 0.034% [5170] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | Remainder: 0.013 - 0.042% | | Remainder: 0.032 - 0.102% | |-> 0.162 - 0.519% [10] {min=0.014, max=0.029, mean=0.016, var=0.000, std dev=0.004} Kokkos::parallel_for [HPX] Kokkos::View::initialization [sigxx] via memset | |-> 0.141 - 0.453% [10] {min=0.013, max=0.016, mean=0.014, var=0.000, std dev=0.001} Kokkos::parallel_for [HPX] Kokkos::View::initialization [sigyy] via memset | |-> 0.130 - 0.417% [10] {min=0.012, max=0.015, mean=0.013, var=0.000, std dev=0.001} Kokkos::parallel_for [HPX] Kokkos::View::initialization [sigzz] via memset | |-> 0.126 - 0.404% [10] {min=0.012, max=0.015, mean=0.013, var=0.000, std dev=0.001} Kokkos::parallel_for [HPX] Kokkos::View::initialization [determ] via memset | |-> 0.112 - 0.359% [10] {min=0.006, max=0.021, mean=0.011, var=0.000, std dev=0.004} Kokkos::parallel_for [HPX] CalcAccelerationForNodes | | |-> 0.045 - 0.143% [10] {min=0.000, max=0.015, mean=0.004, var=0.000, std dev=0.004} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 3.261 - 10.456% [1290] {min=0.001, max=0.020, mean=0.003, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.067 - 0.215% | |-> 0.104 - 0.333% [10] {min=0.005, max=0.014, mean=0.010, var=0.000, std dev=0.003} Kokkos::parallel_for [HPX] CalcPositionForNodes | | |-> 0.024 - 0.078% [10] {min=0.000, max=0.004, mean=0.002, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 3.631 - 11.640% [1290] {min=0.000, max=0.009, mean=0.003, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.079 - 0.254% | |-> 0.099 - 0.316% [10] {min=0.009, max=0.011, mean=0.010, var=0.000, std dev=0.001} Kokkos::parallel_for [HPX] InitStressTermsForElems | | |-> 0.056 - 0.179% [10] {min=0.000, max=0.008, mean=0.006, var=0.000, std dev=0.002} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 3.602 - 11.550% [1270] {min=0.000, max=0.009, mean=0.003, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.043 - 0.137% | |-> 0.085 - 0.273% [10] {min=0.008, max=0.010, mean=0.009, var=0.000, std dev=0.001} Kokkos::parallel_reduce [HPX] ZL20CalcLagrangeElementsR6DomainEUliRiE_ | | |-> 0.043 - 0.138% [10] {min=0.000, max=0.006, mean=0.004, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 2.957 - 9.479% [1270] {min=0.000, max=0.005, mean=0.002, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | |-> 0.003 - 0.008% [10] {min=0.000, max=0.000, mean=0.000, var=-0.000, std dev=-nan} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.001 - 0.005% [470] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | Remainder: 0.001 - 0.004% | | Remainder: 0.040 - 0.127% | |-> 0.084 - 0.270% [10] {min=0.006, max=0.010, mean=0.008, var=0.000, std dev=0.001} Kokkos::parallel_for [HPX] CalcVelocityForNodes | | |-> 0.024 - 0.078% [10] {min=0.000, max=0.003, mean=0.002, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 3.034 - 9.728% [1290] {min=0.000, max=0.006, mean=0.002, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.060 - 0.192% | |-> 0.074 - 0.238% [10] {min=0.007, max=0.008, mean=0.007, var=0.000, std dev=0.001} Kokkos::parallel_for [HPX] ApplyMaterialPropertiesForElems A | | |-> 0.045 - 0.144% [10] {min=0.000, max=0.007, mean=0.005, var=0.000, std dev=0.002} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 2.283 - 7.320% [1270] {min=0.000, max=0.006, mean=0.002, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.029 - 0.094% | |-> 0.061 - 0.194% [10] {min=0.006, max=0.007, mean=0.006, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] ApplyMaterialPropertiesForElems C | | |-> 0.030 - 0.097% [10] {min=0.000, max=0.004, mean=0.003, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 2.087 - 6.692% [1270] {min=0.000, max=0.005, mean=0.002, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.030 - 0.097% | |-> 0.059 - 0.188% [1] {min=0.059, max=0.059, mean=0.059, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] Kokkos::View::initialization [nodeElemCornerList] via memset | |-> 0.057 - 0.181% [10] {min=0.003, max=0.014, mean=0.006, var=0.000, std dev=0.003} Kokkos::parallel_for [HPX] CalcForceForNodes | | |-> 0.029 - 0.094% [10] {min=0.000, max=0.012, mean=0.003, var=0.000, std dev=0.003} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 1.585 - 5.083% [1290] {min=0.000, max=0.013, mean=0.001, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.027 - 0.088% | |-> 0.052 - 0.167% [10] {min=0.005, max=0.006, mean=0.005, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] ApplyMaterialPropertiesForElems B | | |-> 0.023 - 0.073% [10] {min=0.000, max=0.004, mean=0.002, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 1.748 - 5.604% [1270] {min=0.000, max=0.004, mean=0.001, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.029 - 0.094% | |-> 0.038 - 0.121% [13] {min=0.000, max=0.006, mean=0.003, var=0.000, std dev=0.001} Kokkos deep copy: Host Scalar -> Host | | |-> 0.037 - 0.120% [13] {min=0.000, max=0.006, mean=0.003, var=0.000, std dev=0.001} Kokkos::parallel_for [HPX] Kokkos::ViewFill-1D | | | |-> 0.017 - 0.056% [12] {min=0.000, max=0.002, mean=0.001, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, Kokkos::MemoryTraits<0> >, Kokkos::LayoutRight, Kokkos::Experimental::HPX, 1, int>, {Kokkos::Experimental::HPX, Kokkos::IndexType}>::, Kokkos::MemoryTraits<0> >, Kokkos::LayoutRight, Kokkos::Experimental::HPX, 1, int>, Kokkos::RangePolicy >, Kokkos::Experimental::HPX>::Member)>&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | | |-> 0.702 - 2.251% [1538] {min=0.000, max=0.002, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, Kokkos::MemoryTraits<0> >, Kokkos::LayoutRight, Kokkos::Experimental::HPX, 1, int>, {Kokkos::Experimental::HPX, Kokkos::IndexType}>::, Kokkos::MemoryTraits<0> >, Kokkos::LayoutRight, Kokkos::Experimental::HPX, 1, int>, Kokkos::RangePolicy >, Kokkos::Experimental::HPX>::Member)>&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.000 - 0.000% [1] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, Kokkos::MemoryTraits<0> >, Kokkos::LayoutRight, Kokkos::Experimental::HPX, 1, int>, {Kokkos::Experimental::HPX, Kokkos::IndexType}>::, Kokkos::MemoryTraits<0> >, Kokkos::LayoutRight, Kokkos::Experimental::HPX, 1, int>, Kokkos::RangePolicy >, Kokkos::Experimental::HPX>::Member)>&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | Remainder: 0.020 - 0.064% | | Remainder: 0.000 - 0.001% | |-> 0.037 - 0.119% [10] {min=0.002, max=0.006, mean=0.004, var=0.000, std dev=0.001} Kokkos::parallel_for [HPX] UpdateVolumesForElems | | |-> 0.017 - 0.055% [10] {min=0.000, max=0.003, mean=0.002, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 1.080 - 3.464% [1270] {min=0.000, max=0.004, mean=0.001, var=0.000, std dev=0.001} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.020 - 0.065% | |-> 0.024 - 0.077% [10] {min=0.002, max=0.006, mean=0.002, var=0.000, std dev=0.001} Kokkos::parallel_reduce [HPX] ZL31ApplyMaterialPropertiesForElemsR6DomainEUliRiE2_ | | |-> 0.012 - 0.038% [10] {min=0.000, max=0.002, mean=0.001, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.400 - 1.281% [1270] {min=0.000, max=0.005, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | |-> 0.002 - 0.007% [10] {min=0.000, max=0.000, mean=0.000, var=-0.000, std dev=-nan} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.001 - 0.004% [470] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | Remainder: 0.001 - 0.003% | | Remainder: 0.010 - 0.031% | |-> 0.021 - 0.066% [10] {min=0.002, max=0.004, mean=0.002, var=0.000, std dev=0.001} Kokkos::parallel_reduce [HPX] ZL23CalcVolumeForceForElemsR6DomainEUliRiE_ | | |-> 0.013 - 0.042% [10] {min=0.000, max=0.002, mean=0.001, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.293 - 0.938% [1270] {min=0.000, max=0.001, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | |-> 0.002 - 0.008% [10] {min=0.000, max=0.000, mean=0.000, var=-0.000, std dev=-nan} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.001 - 0.005% [470] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | Remainder: 0.001 - 0.003% | | Remainder: 0.005 - 0.017% | |-> 0.020 - 0.064% [10] {min=0.001, max=0.003, mean=0.002, var=0.000, std dev=0.000} Kokkos::parallel_reduce [HPX] ZL13CalcQForElemsR6DomainEUlRKiRiE_ | | |-> 0.012 - 0.039% [10] {min=0.000, max=0.002, mean=0.001, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.371 - 1.190% [1270] {min=0.000, max=0.001, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::InvalidType, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | |-> 0.002 - 0.007% [10] {min=0.000, max=0.000, mean=0.000, var=-0.000, std dev=-nan} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.006 - 0.019% [470] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelReduce, ReducerType, Kokkos::Experimental::HPX>::execute_task, Kokkos::InvalidType, {Kokkos::Experimental::HPX}>::&, int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.006 - 0.018% | |-> 0.009 - 0.027% [1] {min=0.009, max=0.009, mean=0.009, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] Kokkos::View::initialization [m_nodeElemStart] via memset | |-> 0.008 - 0.026% [1] {min=0.008, max=0.008, mean=0.008, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] Kokkos::View::initialization [nodeElemCount] via memset | |-> 0.007 - 0.024% [1] {min=0.007, max=0.007, mean=0.007, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] Kokkos::View::initialization [regElemlist::entries] via memset | |-> 0.007 - 0.022% [10] {min=0.001, max=0.001, mean=0.001, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] ApplyAccelerationBoundaryConditionsForNodes C | | |-> 0.006 - 0.018% [10] {min=0.000, max=0.001, mean=0.001, var=-0.000, std dev=-nan} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.018 - 0.057% [1290] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.001 - 0.003% | |-> 0.007 - 0.022% [10] {min=0.001, max=0.001, mean=0.001, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] ApplyAccelerationBoundaryConditionsForNodes B | | |-> 0.006 - 0.019% [10] {min=0.000, max=0.001, mean=0.001, var=-0.000, std dev=-nan} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.022 - 0.071% [1290] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.001 - 0.003% | |-> 0.007 - 0.021% [10] {min=0.001, max=0.001, mean=0.001, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] ApplyAccelerationBoundaryConditionsForNodes A | | |-> 0.006 - 0.019% [10] {min=0.000, max=0.001, mean=0.001, var=-0.000, std dev=-nan} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | | |-> 0.019 - 0.062% [1290] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} decltype(auto) hpx::execution::parallel_policy_executor::bulk_async_execute(F&&, const S&, Ts&& ...) const [with F = hpx::parallel::util::detail::partitioner_iteration, hpx::execution::static_chunk_size>, Kokkos::Impl::ParallelFor, Kokkos::Experimental::HPX>::execute_task, {Kokkos::Experimental::HPX}>::, Kokkos::RangePolicy, Kokkos::Experimental::HPX>::Member)>&, long unsigned int, hpx::tuple<> > >; S = hpx::util::iterator_range, hpx::parallel::util::detail::chunk_size_idx_iterator >; Ts = {}; Policy = hpx::launch] | | Remainder: 0.001 - 0.002% | |-> 0.001 - 0.002% [1] {min=0.001, max=0.001, mean=0.001, var=0.000, std dev=0.000} run_helper | |-> 0.000 - 0.001% [126] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] Kokkos::ViewCopy-1D | |-> 0.000 - 0.000% [35] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} Kokkos deep copy: Host -> Host | |-> 0.000 - 0.000% [1] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} parallel_policy_executor::post | |-> 0.000 - 0.000% [1] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] Kokkos::ViewCopy-2D | |-> 0.000 - 0.000% [1] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} Kokkos deep copy: Host nodeElemCornerList -> Host nodeElemCornerList | |-> 0.000 - 0.000% [1] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} Kokkos deep copy: Host regElemlist::entries -> Host regElemlist::entries | |-> 0.000 - 0.000% [1] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] Kokkos::View::initialization [regElemlist::row_map] via memset | |-> 0.000 - 0.000% [1] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} Kokkos::parallel_for [HPX] Kokkos::View::initialization [regBinEnd] via memset | |-> 0.000 - 0.000% [1] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} Kokkos deep copy: Host m_nodeElemStart -> Host m_nodeElemStart | |-> 0.000 - 0.000% [1] {min=0.000, max=0.000, mean=0.000, var=0.000, std dev=0.000} Kokkos deep copy: Host regElemlist::row_map -> Host regElemlist::row_map | Remainder: 1.552 - 4.976%