ID | Module | Source Location | Source Function | Level | Max Time Over Threads (s) | Time w.r.t. Wall Time (s) | Coverage (% app. time) | Speedup if no scalar integer | Speedup if FP arith vectorized | Speedup if fully vectorized | Speedup if FP only | Number of paths | Vectorization Ratio (%) | Vector Length Use (%) | Flops (GFLOP/s) | CQA cycles | CQA cycles if no scalar integer | CQA cycles if FP arith vectorized | CQA cycles if fully vectorized | CQA cycles if FP only |
○Loop 1092 | exec | viscosity_kernel.f90-pp.f90:56-89 | __nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_ | Innermost | 3.02 | 3.02 | 13.32 | 1.01 | 1.00 | 1.01 | 1.41 | 1 | 92.00 | 95.00 | 0.00 | 39.50 | 39.00 | 39.50 | 39.13 | 28.00 |
○Loop 571 | exec | calc_dt_kernel.f90-pp.f90:126-126 | __nv_calc_dt_kernel_module_calc_dt_kernel__F1L89_1_ | Outermost | 2.56 | 2.56 | 11.29 | NA | NA | NA | NA | NA | NA | NA | 0.00 | NA | NA | NA | NA | NA |
○Loop 540 | exec | advec_mom_kernel.f90-pp.f90:215-215,advec_mom_kernel.f90-pp.f90:227-241 | advec_mom_kernel | Innermost | 1.59 | 1.59 | 7.03 | 2.30 | 1.00 | 4.49 - 7.22 | 1.84 | 2 | 0.00 | 22.47 | 0.00 | 5.75 | 2.50 | 5.75 | 1.28 - 0.80 | 3.13 |
○Loop 606 | exec | ideal_gas_kernel.f90-pp.f90:50-55 | __nv_ideal_gas_kernel_module_ideal_gas_kernel__F1L45_1_ | Innermost | 1.52 | 1.52 | 6.72 | 1.00 | 1.00 | 1.00 | 1.13 | 1 | 92.31 | 100.00 | 0.00 | 4.50 | 4.50 | 4.50 | 4.50 | 4.00 |
○Loop 522 | exec | advec_cell_kernel.f90-pp.f90:202-204,advec_cell_kernel.f90-pp.f90:210-210,advec_cell_kernel.f90-pp.f90:216-249 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Single | 1.28 | 1.28 | 5.64 | 3.50 | 1.00 | 7.28 | 2.00 | 1 | 0.00 | 20.00 | 0.00 | 14.00 | 4.00 | 14.00 | 1.92 | 7.00 |
○Loop 49 | exec | PdV_kernel.f90-pp.f90:77-87,PdV_kernel.f90-pp.f90:93-99 | __nv_pdv_kernel_module_pdv_kernel__F1L67_1_ | Innermost | 1.18 | 1.18 | 5.18 | 1.00 | 1.00 | 1.00 | 1.00 | 1 | 100.00 | 100.00 | 0.00 | 16.50 | 16.50 | 16.50 | 16.50 | 16.50 |
○Loop 545 | exec | advec_mom_kernel.f90-pp.f90:152-177 | advec_mom_kernel | Innermost | 1.17 | 1.17 | 5.16 | 2.26 | 1.00 | 4.37 - 6.96 | 1.81 | 4 | 0.00 | 22.25 | 0.00 | 5.66 | 2.50 | 5.66 | 1.29 - 0.81 | 3.13 |
○Loop 523 | exec | advec_cell_kernel.f90-pp.f90:112-149,advec_cell_kernel.f90-pp.f90:155-158 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Single | 1.14 | 1.14 | 5.03 | 3.50 | 1.00 | 6.89 | 2.00 | 1 | 0.00 | 21.55 | 0.00 | 14.00 | 4.00 | 14.00 | 2.03 | 7.00 |
○Loop 52 | exec | PdV_kernel.f90-pp.f90:113-123,PdV_kernel.f90-pp.f90:129-135 | __nv_pdv_kernel_module_pdv_kernel__F1L67_1_ | Innermost | 1.12 | 1.12 | 4.92 | 1.00 | 1.00 | 1.00 | 1.00 | 1 | 95.24 | 96.43 | 0.00 | 16.50 | 16.50 | 16.50 | 16.50 | 16.50 |
○Loop 572 | exec | calc_dt_kernel.f90-pp.f90:96-132 | __nv_calc_dt_kernel_module_calc_dt_kernel__F1L89_1_ | Innermost | 0.93 | 0.93 | 4.08 | 2.73 | 1.84 | 3.64 - 6.53 | 1.82 - 1.96 | 1 | 31.82 | 31.82 | 0.00 | 12.75 | 4.67 | 6.94 | 3.50 - 1.95 | 7.00 - 6.50 |
○Loop 515 | exec | accelerate_kernel.f90-pp.f90:63-63,accelerate_kernel.f90-pp.f90:69-75 | __nv_accelerate_kernel_module_accelerate_kernel__F1L57_1_ | Innermost | 0.8 | 0.8 | 3.53 | 1.00 | 1.00 | 1.00 | 1.04 | 1 | 98.08 | 100.00 | 0.00 | 14.00 | 14.00 | 14.00 | 14.00 | 13.50 |
○Loop 518 | exec | advec_cell_kernel.f90-pp.f90:256-261 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Innermost | 0.6 | 0.6 | 2.67 | 1.00 | 1.00 | 1.00 | 1.22 | 1 | 100.00 | 100.00 | 0.00 | 5.50 | 5.50 | 5.50 | 5.50 | 4.50 |
○Loop 521 | exec | advec_cell_kernel.f90-pp.f90:165-170 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Innermost | 0.57 | 0.57 | 2.51 | 1.00 | 1.00 | 1.00 | 1.22 | 1 | 100.00 | 100.00 | 0.00 | 5.50 | 5.50 | 5.50 | 5.50 | 4.50 |
○Loop 538 | exec | advec_mom_kernel.f90-pp.f90:248-248 | advec_mom_kernel | Innermost | 0.56 | 0.56 | 2.49 | 1.00 | 1.00 | 1.00 | 2.00 | 1 | 100.00 | 100.00 | 0.00 | 6.00 | 6.00 | 6.00 | 6.00 | 3.00 |
○Loop 543 | exec | advec_mom_kernel.f90-pp.f90:184-184 | advec_mom_kernel | Innermost | 0.54 | 0.54 | 2.38 | 1.00 | 1.00 | 1.00 | 2.00 | 1 | 100.00 | 100.00 | 0.00 | 6.00 | 6.00 | 6.00 | 6.00 | 3.00 |
○Loop 584 | exec | flux_calc_kernel.f90-pp.f90:57-59 | __nv_flux_calc_kernel_module_flux_calc_kernel__F1L49_1_ | Innermost | 0.49 | 0.49 | 2.18 | 1.00 | 1.00 | 1.00 | 1.20 | 1 | 100.00 | 100.00 | 0.00 | 6.00 | 6.00 | 6.00 | 6.00 | 5.00 |
○Loop 551 | exec | advec_mom_kernel.f90-pp.f90:204-208 | advec_mom_kernel | Innermost | 0.39 | 0.39 | 1.72 | 1.00 | 1.00 | 1.00 | 1.50 | 1 | 100.00 | 100.00 | 0.00 | 6.00 | 6.00 | 6.00 | 6.00 | 4.00 |
○Loop 548 | exec | advec_mom_kernel.f90-pp.f90:140-144 | advec_mom_kernel | Innermost | 0.34 | 0.34 | 1.48 | 1.00 | 1.00 | 1.00 | 1.50 | 1 | 100.00 | 100.00 | 0.00 | 6.00 | 6.00 | 6.00 | 6.00 | 4.00 |
○Loop 569 | exec | advec_mom_kernel.f90-pp.f90:86-87 | advec_mom_kernel | Innermost | 0.32 | 0.32 | 1.43 | 1.00 | 1.00 | 1.00 | 1.75 | 1 | 100.00 | 100.00 | 0.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.00 |
○Loop 566 | exec | advec_mom_kernel.f90-pp.f90:96-97 | advec_mom_kernel | Innermost | 0.29 | 0.29 | 1.3 | 1.00 | 1.00 | 1.00 | 1.75 | 1 | 100.00 | 100.00 | 0.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.00 |
○Loop 695 | exec | reset_field_kernel.f90-pp.f90:52-53 | __nv_reset_field_kernel_module_reset_field_kernel__F1L47_1_ | Innermost | 0.25 | 0.25 | 1.1 | 1.00 | 1.00 | 1.00 | 4.00 | 1 | 100.00 | 100.00 | 0.00 | 4.00 | 4.00 | 4.00 | 4.00 | 1.00 |
○Loop 698 | exec | revert_kernel.f90-pp.f90:47-48 | __nv_revert_kernel_module_revert_kernel__F1L41_1_ | Innermost | 0.25 | 0.25 | 1.1 | 1.00 | 1.00 | 1.00 | 4.00 | 1 | 100.00 | 100.00 | 0.00 | 4.00 | 4.00 | 4.00 | 4.00 | 1.00 |
○Loop 563 | exec | advec_mom_kernel.f90-pp.f90:106-107 | advec_mom_kernel | Innermost | 0.21 | 0.21 | 0.93 | 1.00 | 1.00 | 1.00 | 2.50 | 1 | 100.00 | 100.00 | 0.00 | 2.50 | 2.50 | 2.50 | 2.50 | 1.00 |
○Loop 560 | exec | advec_mom_kernel.f90-pp.f90:116-117 | advec_mom_kernel | Innermost | 0.21 | 0.21 | 0.93 | 1.00 | 1.00 | 1.00 | 2.50 | 1 | 100.00 | 100.00 | 0.00 | 2.50 | 2.50 | 2.50 | 2.50 | 1.00 |
○Loop 692 | exec | reset_field_kernel.f90-pp.f90:62-63 | __nv_reset_field_kernel_module_reset_field_kernel__F1L47_1_ | Innermost | 0.2 | 0.2 | 0.9 | 1.00 | 1.00 | 1.00 | 4.00 | 1 | 100.00 | 100.00 | 0.00 | 4.00 | 4.00 | 4.00 | 4.00 | 1.00 |
○Loop 535 | exec | advec_cell_kernel.f90-pp.f90:90-91 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Innermost | 0.14 | 0.14 | 0.64 | 1.00 | 1.00 | 1.00 | 1.40 | 1 | 100.00 | 100.00 | 0.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.50 |
○Loop 529 | exec | advec_cell_kernel.f90-pp.f90:182-183 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Innermost | 0.14 | 0.14 | 0.64 | 1.00 | 1.00 | 1.00 | 1.40 | 1 | 100.00 | 100.00 | 0.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.50 |
○Loop 554 | exec | advec_mom_kernel.f90-pp.f90:195-195 | advec_mom_kernel | Innermost | 0.13 | 0.13 | 0.6 | 1.00 | 1.00 | 1.00 | 1.25 | 1 | 100.00 | 100.00 | 0.00 | 5.00 | 5.00 | 5.00 | 5.00 | 4.00 |
○Loop 532 | exec | advec_cell_kernel.f90-pp.f90:192-193 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Innermost | 0.11 | 0.11 | 0.49 | 1.00 | 1.00 | 1.00 | 2.50 | 1 | 100.00 | 100.00 | 0.00 | 2.50 | 2.50 | 2.50 | 2.50 | 1.00 |
○Loop 557 | exec | advec_mom_kernel.f90-pp.f90:130-130 | advec_mom_kernel | Innermost | 0.1 | 0.1 | 0.46 | 1.00 | 1.00 | 1.00 | 1.25 | 1 | 100.00 | 100.00 | 0.00 | 5.00 | 5.00 | 5.00 | 5.00 | 4.00 |
○Loop 526 | exec | advec_cell_kernel.f90-pp.f90:100-101 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Innermost | 0.1 | 0.1 | 0.44 | 1.00 | 1.00 | 1.00 | 2.50 | 1 | 100.00 | 100.00 | 0.00 | 2.50 | 2.50 | 2.50 | 2.50 | 1.00 |
○Loop 573 | exec | field_summary_kernel.f90-pp.f90:62-71 | __nv_field_summary_kernel_module_field_summary_kernel__F1L54_1_ | Innermost | 0.07 | 0.07 | 0.33 | 1.00 | 1.00 | 1.00 | 1.00 | 1 | 94.44 | 97.92 | 0.00 | 11.50 | 11.50 | 11.50 | 11.50 | 11.50 |
○Loop 21 | exec | build_field.f90-pp.f90:104-116 | __nv_build_field__F1L100_1_ | Innermost | 0.05 | 0.05 | 0.22 | 1.00 | 1.00 | 8.00 | 1.01 | 1 | 0.00 | 16.67 | 0.00 | 22.17 | 22.17 | 22.17 | 2.77 | 22.00 |
○Loop 19 | exec | build_field.f90-pp.f90:123-131 | __nv_build_field__F1L100_1_ | Innermost | 0.04 | 0.04 | 0.18 | 1.00 | 1.00 | 8.00 | 1.00 | 1 | 0.00 | 16.67 | 0.00 | 16.00 | 16.00 | 16.00 | 2.00 | 16.00 |
○Loop 888 | exec | update_halo_kernel.f90-pp.f90:168-169 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0.02 | 0.02 | 0.09 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | 0.00 | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 793 | exec | update_halo_kernel.f90-pp.f90:473-474 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0.02 | 0.02 | 0.09 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | 0.00 | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 763 | exec | update_halo_kernel.f90-pp.f90:559-560 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0.01 | 0.01 | 0.07 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | 0.00 | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 734 | exec | update_halo_kernel.f90-pp.f90:649-650 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0.01 | 0.01 | 0.07 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | 0.00 | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 17 | exec | build_field.f90-pp.f90:138-141 | __nv_build_field__F1L100_1_ | Innermost | 0.01 | 0.01 | 0.07 | 1.00 | 1.00 | 8.00 | 1.03 | 1 | 0.00 | 16.67 | 0.00 | 6.17 | 6.17 | 6.17 | 0.77 | 6.00 |
○Loop 541 | exec | advec_mom_kernel.f90-pp.f90:183-186 | advec_mom_kernel | Outermost | 0.01 | 0.01 | 0.07 | 1.00 | 1.00 | 4.96 | 3.15 | 3 | 0.00 | 21.09 | 0.00 | 3.50 | 3.50 | 3.50 | 0.71 | 1.11 |
○Loop 15 | exec | build_field.f90-pp.f90:147-150 | __nv_build_field__F1L100_1_ | Innermost | 0.01 | 0.01 | 0.07 | 1.00 | 1.00 | 8.00 | 1.03 | 1 | 0.00 | 16.67 | 0.00 | 6.17 | 6.17 | 6.17 | 0.77 | 6.00 |
○Loop 789 | exec | update_halo_kernel.f90-pp.f90:483-484 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0.01 | 0.01 | 0.04 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | 0.00 | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 583 | exec | flux_calc_kernel.f90-pp.f90:54-56,flux_calc_kernel.f90-pp.f90:61-62 | __nv_flux_calc_kernel_module_flux_calc_kernel__F1L49_1_ | Outermost | 0.01 | 0.01 | 0.04 | 1.00 | 1.00 | 4.39 | 7.00 | 2 | 0.00 | 24.26 | 0.00 | 7.00 | 7.00 | 7.00 | 1.59 | 1.00 |
○Loop 886 | exec | update_halo_kernel.f90-pp.f90:167-170 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | InBetween | 0 | 0 | 0.02 | 1.00 | 1.00 | 5.45 | 3.75 | 1 | 0.00 | 21.25 | NA | 3.75 | 3.75 | 3.75 | 0.69 | 1.00 |
○Loop 862 | exec | update_halo_kernel.f90-pp.f90:254-255 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 778 | exec | update_halo_kernel.f90-pp.f90:516-517 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 774 | exec | update_halo_kernel.f90-pp.f90:526-527 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 764 | exec | update_halo_kernel.f90-pp.f90:548-551 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | InBetween | 0 | 0 | 0.02 | 1.00 | 1.00 | 1.82 | 2.50 | 1 | 7.14 | 28.57 | NA | 5.00 | 5.00 | 5.00 | 2.75 | 2.00 |
○Loop 759 | exec | update_halo_kernel.f90-pp.f90:569-570 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 748 | exec | update_halo_kernel.f90-pp.f90:606-607 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 600 | exec | generate_chunk_kernel.f90-pp.f90:98-98 | __nv_generate_chunk_kernel_module_generate_chunk_kernel__F1L85_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 1.00 | 1.00 | 1 | 100.00 | 100.00 | NA | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 |
○Loop 549 | exec | advec_mom_kernel.f90-pp.f90:204-209 | advec_mom_kernel | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 2.67 | 1.78 | 1 | 50.00 | 35.42 | NA | 2.67 | 2.67 | 2.67 | 1.00 | 1.50 |
○Loop 546 | exec | advec_mom_kernel.f90-pp.f90:138-138,advec_mom_kernel.f90-pp.f90:144-146 | advec_mom_kernel | Outermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.96 | 5.44 | 1 | 0.00 | 23.21 | NA | 12.25 | 12.25 | 12.25 | 2.47 | 2.25 |
○Loop 591 | exec | generate_chunk_kernel.f90-pp.f90:130-137,generate_chunk_kernel.f90-pp.f90:166-166 | __nv_generate_chunk_kernel_module_generate_chunk_kernel__F1L85_1_ | Innermost | 0 | 0 | 0.02 | 1.48 | 1.00 | 4.61 | 5.67 | 5 | 21.05 | 28.95 | NA | 11.33 | 7.67 | 11.33 | 2.46 | 2.00 |
○Loop 513 | exec | accelerate_kernel.f90-pp.f90:63-63,accelerate_kernel.f90-pp.f90:69-77 | __nv_accelerate_kernel_module_accelerate_kernel__F1L57_1_ | Innermost | 0 | 0 | 0.02 | 1.45 | 1.00 | 3.63 | 1.07 | 1 | 52.94 | 36.76 | NA | 7.25 | 5.00 | 7.25 | 2.00 | 6.75 |