ID | Module | Source Location | Source Function | Level | Max Time Over Threads (s) | Time w.r.t. Wall Time (s) | Coverage (% app. time) | Speedup if no scalar integer | Speedup if FP arith vectorized | Speedup if fully vectorized | Speedup if FP only | Number of paths | Vectorization Ratio (%) | Vector Length Use (%) | Flops (GFLOP/s) | CQA cycles | CQA cycles if no scalar integer | CQA cycles if FP arith vectorized | CQA cycles if fully vectorized | CQA cycles if FP only |
○Loop 1097 | exec | viscosity_kernel.f90-pp.f90:56-89 | __nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_ | Innermost | 2.32 | 2.32 | 11.51 | 1.01 | 1.00 | 1.01 | 1.25 | 1 | 94.25 | 98.28 | 0.00 | 35.00 | 34.50 | 35.00 | 34.63 | 28.00 |
○Loop 576 | exec | calc_dt_kernel.f90-pp.f90:107-131 | __nv_calc_dt_kernel_module_calc_dt_kernel__F1L89_1_ | Innermost | 2.29 | 2.29 | 11.36 | 1.22 | 1.95 | 3.00 - 5.92 | 1.22 | 2 | 38.89 | 33.33 | 0.00 | 9.75 | 8.00 | 5.01 | 3.25 - 1.65 | 8.00 |
○Loop 610 | exec | ideal_gas_kernel.f90-pp.f90:50-55 | __nv_ideal_gas_kernel_module_ideal_gas_kernel__F1L45_1_ | Innermost | 1.56 | 1.56 | 7.76 | 1.00 | 1.00 | 1.00 | 1.13 | 1 | 92.31 | 100.00 | 0.00 | 4.50 | 4.50 | 4.50 | 4.50 | 4.00 |
○Loop 544 | exec | advec_mom_kernel.f90-pp.f90:215-215,advec_mom_kernel.f90-pp.f90:227-241 | advec_mom_kernel | Innermost | 1.55 | 1.55 | 7.71 | 2.20 | 1.00 | 5.33 - 7.04 | 1.83 | 2 | 0.00 | 22.47 | 0.00 | 5.50 | 2.50 | 5.50 | 1.03 - 0.78 | 3.00 |
○Loop 523 | exec | advec_cell_kernel.f90-pp.f90:202-204,advec_cell_kernel.f90-pp.f90:210-210,advec_cell_kernel.f90-pp.f90:216-249 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Single | 1.22 | 1.22 | 6.08 | 3.28 | 1.00 | 7.12 | 1.94 | 1 | 0.00 | 20.00 | 0.00 | 13.13 | 4.00 | 13.13 | 1.84 | 6.75 |
○Loop 552 | exec | advec_mom_kernel.f90-pp.f90:152-177 | advec_mom_kernel | Innermost | 1.19 | 1.19 | 5.9 | 2.16 | 1.00 | 5.18 - 6.78 | 1.80 | 4 | 0.00 | 22.25 | 0.00 | 5.41 | 2.50 | 5.41 | 1.04 - 0.80 | 3.00 |
○Loop 527 | exec | advec_cell_kernel.f90-pp.f90:112-149,advec_cell_kernel.f90-pp.f90:155-158 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Single | 1.09 | 1.09 | 5.38 | 3.31 | 1.00 | 6.78 | 1.96 | 1 | 0.00 | 21.55 | 0.00 | 13.25 | 4.00 | 13.25 | 1.95 | 6.75 |
○Loop 49 | exec | PdV_kernel.f90-pp.f90:111-123,PdV_kernel.f90-pp.f90:131-135 | __nv_pdv_kernel_module_pdv_kernel__F1L67_1_ | Innermost | 0.91 | 0.91 | 4.51 | 1.00 | 1.00 | 1.00 | 1.08 | 1 | 96.30 | 100.00 | 0.00 | 13.50 | 13.50 | 13.50 | 13.50 | 12.50 |
○Loop 519 | exec | accelerate_kernel.f90-pp.f90:63-63,accelerate_kernel.f90-pp.f90:69-75 | __nv_accelerate_kernel_module_accelerate_kernel__F1L57_1_ | Innermost | 0.82 | 0.82 | 4.09 | 1.00 | 1.00 | 1.00 | 1.04 | 1 | 97.96 | 100.00 | 0.00 | 12.50 | 12.50 | 12.50 | 12.50 | 12.00 |
○Loop 52 | exec | PdV_kernel.f90-pp.f90:77-87,PdV_kernel.f90-pp.f90:95-99 | __nv_pdv_kernel_module_pdv_kernel__F1L67_1_ | Innermost | 0.75 | 0.75 | 3.75 | 1.00 | 1.00 | 1.00 | 1.19 | 1 | 97.22 | 100.00 | 0.00 | 9.50 | 9.50 | 9.50 | 9.50 | 8.00 |
○Loop 522 | exec | advec_cell_kernel.f90-pp.f90:256-261 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Innermost | 0.62 | 0.62 | 3.08 | 1.00 | 1.00 | 1.00 | 1.22 | 1 | 100.00 | 100.00 | 0.00 | 5.50 | 5.50 | 5.50 | 5.50 | 4.50 |
○Loop 526 | exec | advec_cell_kernel.f90-pp.f90:165-170 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Innermost | 0.61 | 0.61 | 3.03 | 1.00 | 1.00 | 1.00 | 1.22 | 1 | 100.00 | 100.00 | 0.00 | 5.50 | 5.50 | 5.50 | 5.50 | 4.50 |
○Loop 542 | exec | advec_mom_kernel.f90-pp.f90:248-248 | advec_mom_kernel | Innermost | 0.54 | 0.54 | 2.7 | 1.00 | 1.00 | 1.00 | 2.00 | 1 | 100.00 | 100.00 | 0.00 | 6.00 | 6.00 | 6.00 | 6.00 | 3.00 |
○Loop 550 | exec | advec_mom_kernel.f90-pp.f90:184-184 | advec_mom_kernel | Innermost | 0.54 | 0.54 | 2.68 | 1.00 | 1.00 | 1.00 | 2.00 | 1 | 100.00 | 100.00 | 0.00 | 6.00 | 6.00 | 6.00 | 6.00 | 3.00 |
○Loop 588 | exec | flux_calc_kernel.f90-pp.f90:57-59 | __nv_flux_calc_kernel_module_flux_calc_kernel__F1L49_1_ | Innermost | 0.49 | 0.49 | 2.46 | 1.00 | 1.00 | 1.00 | 1.20 | 1 | 100.00 | 100.00 | 0.00 | 6.00 | 6.00 | 6.00 | 6.00 | 5.00 |
○Loop 547 | exec | advec_mom_kernel.f90-pp.f90:204-208 | advec_mom_kernel | Innermost | 0.41 | 0.41 | 2.03 | 1.00 | 1.00 | 1.00 | 1.71 | 1 | 100.00 | 100.00 | 0.00 | 6.00 | 6.00 | 6.00 | 6.00 | 3.50 |
○Loop 555 | exec | advec_mom_kernel.f90-pp.f90:140-144 | advec_mom_kernel | Innermost | 0.3 | 0.3 | 1.49 | 1.00 | 1.00 | 1.00 | 1.71 | 1 | 100.00 | 100.00 | 0.00 | 6.00 | 6.00 | 6.00 | 6.00 | 3.50 |
○Loop 570 | exec | advec_mom_kernel.f90-pp.f90:96-97 | advec_mom_kernel | Innermost | 0.29 | 0.29 | 1.44 | 1.00 | 1.00 | 1.00 | 1.75 | 1 | 100.00 | 100.00 | 0.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.00 |
○Loop 573 | exec | advec_mom_kernel.f90-pp.f90:86-87 | advec_mom_kernel | Innermost | 0.27 | 0.27 | 1.34 | 1.00 | 1.00 | 1.00 | 1.75 | 1 | 100.00 | 100.00 | 0.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.00 |
○Loop 699 | exec | reset_field_kernel.f90-pp.f90:52-53 | __nv_reset_field_kernel_module_reset_field_kernel__F1L47_1_ | Innermost | 0.25 | 0.25 | 1.26 | 1.00 | 1.00 | 1.00 | 4.00 | 1 | 100.00 | 100.00 | 0.00 | 4.00 | 4.00 | 4.00 | 4.00 | 1.00 |
○Loop 564 | exec | advec_mom_kernel.f90-pp.f90:116-117 | advec_mom_kernel | Innermost | 0.24 | 0.24 | 1.22 | 1.00 | 1.00 | 1.00 | 2.50 | 1 | 100.00 | 100.00 | 0.00 | 2.50 | 2.50 | 2.50 | 2.50 | 1.00 |
○Loop 702 | exec | revert_kernel.f90-pp.f90:47-48 | __nv_revert_kernel_module_revert_kernel__F1L41_1_ | Innermost | 0.24 | 0.24 | 1.19 | 1.00 | 1.00 | 1.00 | 4.00 | 1 | 100.00 | 100.00 | 0.00 | 4.00 | 4.00 | 4.00 | 4.00 | 1.00 |
○Loop 567 | exec | advec_mom_kernel.f90-pp.f90:106-107 | advec_mom_kernel | Innermost | 0.21 | 0.21 | 1.07 | 1.00 | 1.00 | 1.00 | 2.50 | 1 | 100.00 | 100.00 | 0.00 | 2.50 | 2.50 | 2.50 | 2.50 | 1.00 |
○Loop 696 | exec | reset_field_kernel.f90-pp.f90:62-63 | __nv_reset_field_kernel_module_reset_field_kernel__F1L47_1_ | Innermost | 0.19 | 0.19 | 0.97 | 1.00 | 1.00 | 1.00 | 4.00 | 1 | 100.00 | 100.00 | 0.00 | 4.00 | 4.00 | 4.00 | 4.00 | 1.00 |
○Loop 539 | exec | advec_cell_kernel.f90-pp.f90:90-91 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Innermost | 0.16 | 0.16 | 0.79 | 1.00 | 1.00 | 1.00 | 1.17 | 1 | 100.00 | 100.00 | 0.00 | 3.50 | 3.50 | 3.50 | 3.50 | 3.00 |
○Loop 530 | exec | advec_cell_kernel.f90-pp.f90:182-183 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Innermost | 0.16 | 0.16 | 0.79 | 1.00 | 1.00 | 1.00 | 1.17 | 1 | 100.00 | 100.00 | 0.00 | 3.50 | 3.50 | 3.50 | 3.50 | 3.00 |
○Loop 558 | exec | advec_mom_kernel.f90-pp.f90:130-130 | advec_mom_kernel | Innermost | 0.14 | 0.14 | 0.69 | 1.00 | 1.00 | 1.00 | 1.25 | 1 | 100.00 | 100.00 | 0.00 | 5.00 | 5.00 | 5.00 | 5.00 | 4.00 |
○Loop 561 | exec | advec_mom_kernel.f90-pp.f90:195-195 | advec_mom_kernel | Innermost | 0.13 | 0.13 | 0.64 | 1.00 | 1.00 | 1.00 | 1.25 | 1 | 100.00 | 100.00 | 0.00 | 5.00 | 5.00 | 5.00 | 5.00 | 4.00 |
○Loop 533 | exec | advec_cell_kernel.f90-pp.f90:192-193 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Innermost | 0.12 | 0.12 | 0.6 | 1.00 | 1.00 | 1.00 | 2.50 | 1 | 100.00 | 100.00 | 0.00 | 2.50 | 2.50 | 2.50 | 2.50 | 1.00 |
○Loop 536 | exec | advec_cell_kernel.f90-pp.f90:100-101 | __nv_advec_cell_kernel_module_advec_cell_kernel__F1L81_1_ | Innermost | 0.09 | 0.09 | 0.47 | 1.00 | 1.00 | 1.00 | 2.50 | 1 | 100.00 | 100.00 | 0.00 | 2.50 | 2.50 | 2.50 | 2.50 | 1.00 |
○Loop 21 | exec | build_field.f90-pp.f90:104-116 | __nv_build_field__F1L100_1_ | Innermost | 0.06 | 0.06 | 0.3 | 1.00 | 1.00 | 8.00 | 1.01 | 1 | 0.00 | 16.67 | 0.00 | 22.17 | 22.17 | 22.17 | 2.77 | 22.00 |
○Loop 19 | exec | build_field.f90-pp.f90:123-131 | __nv_build_field__F1L100_1_ | Innermost | 0.06 | 0.06 | 0.3 | 1.00 | 1.00 | 8.00 | 1.00 | 1 | 0.00 | 16.67 | 0.00 | 16.00 | 16.00 | 16.00 | 2.00 | 16.00 |
○Loop 577 | exec | field_summary_kernel.f90-pp.f90:62-71 | __nv_field_summary_kernel_module_field_summary_kernel__F1L54_1_ | Innermost | 0.05 | 0.05 | 0.25 | 1.00 | 1.00 | 1.00 | 1.00 | 1 | 100.00 | 100.00 | 0.00 | 7.50 | 7.50 | 7.50 | 7.50 | 7.50 |
○Loop 17 | exec | build_field.f90-pp.f90:138-141 | __nv_build_field__F1L100_1_ | Innermost | 0.02 | 0.02 | 0.12 | 1.00 | 1.00 | 8.00 | 1.03 | 1 | 0.00 | 16.67 | 0.00 | 6.17 | 6.17 | 6.17 | 0.77 | 6.00 |
○Loop 887 | exec | update_halo_kernel.f90-pp.f90:178-179 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Single | 0.01 | 0.01 | 0.07 | 1.31 | 1.00 | 5.25 | 1.75 | 1 | 0.00 | 22.92 | 0.00 | 1.75 | 1.33 | 1.75 | 0.33 | 1.00 |
○Loop 734 | exec | update_halo_kernel.f90-pp.f90:659-660 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Single | 0.01 | 0.01 | 0.07 | 1.31 | 1.00 | 5.25 | 1.75 | 1 | 0.00 | 22.92 | 0.00 | 1.75 | 1.33 | 1.75 | 0.33 | 1.00 |
○Loop 15 | exec | build_field.f90-pp.f90:147-150 | __nv_build_field__F1L100_1_ | Innermost | 0.01 | 0.01 | 0.07 | 1.00 | 1.00 | 8.00 | 1.03 | 1 | 0.00 | 16.67 | 0.00 | 6.17 | 6.17 | 6.17 | 0.77 | 6.00 |
○Loop 892 | exec | update_halo_kernel.f90-pp.f90:168-169 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0.01 | 0.01 | 0.05 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | 0.00 | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 866 | exec | update_halo_kernel.f90-pp.f90:254-255 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0.01 | 0.01 | 0.05 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | 0.00 | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 738 | exec | update_halo_kernel.f90-pp.f90:649-650 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0.01 | 0.01 | 0.05 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | 0.00 | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 553 | exec | advec_mom_kernel.f90-pp.f90:138-138,advec_mom_kernel.f90-pp.f90:144-146 | advec_mom_kernel | Outermost | 0.01 | 0.01 | 0.05 | 1.00 | 1.00 | 4.96 | 5.44 | 1 | 0.00 | 23.21 | 0.00 | 12.25 | 12.25 | 12.25 | 2.47 | 2.25 |
○Loop 879 | exec | update_halo_kernel.f90-pp.f90:211-212 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 853 | exec | update_halo_kernel.f90-pp.f90:297-298 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 812 | exec | update_halo_kernel.f90-pp.f90:430-431 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 797 | exec | update_halo_kernel.f90-pp.f90:473-474 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 767 | exec | update_halo_kernel.f90-pp.f90:559-560 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 742 | exec | update_halo_kernel.f90-pp.f90:639-640 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 725 | exec | update_halo_kernel.f90-pp.f90:692-693 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 601 | exec | generate_chunk_kernel.f90-pp.f90:106-106 | __nv_generate_chunk_kernel_module_generate_chunk_kernel__F1L85_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 1.00 | 1.00 | 1 | 100.00 | 100.00 | NA | 1.00 | 1.00 | 1.00 | 1.00 | 1.00 |
○Loop 549 | exec | advec_mom_kernel.f90-pp.f90:184-185 | advec_mom_kernel | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 2.17 | 1 | 0.00 | 21.88 | NA | 2.17 | 2.17 | 2.17 | 0.54 | 1.00 |
○Loop 548 | exec | advec_mom_kernel.f90-pp.f90:183-186 | advec_mom_kernel | Outermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.96 | 3.15 | 3 | 0.00 | 21.09 | NA | 3.50 | 3.50 | 3.50 | 0.71 | 1.11 |
○Loop 595 | exec | generate_chunk_kernel.f90-pp.f90:130-137,generate_chunk_kernel.f90-pp.f90:166-166 | __nv_generate_chunk_kernel_module_generate_chunk_kernel__F1L85_1_ | Innermost | 0 | 0 | 0.02 | 1.48 | 1.00 | 4.61 | 5.67 | 5 | 21.05 | 28.95 | NA | 11.33 | 7.67 | 11.33 | 2.46 | 2.00 |
○Loop 546 | exec | advec_mom_kernel.f90-pp.f90:201-203,advec_mom_kernel.f90-pp.f90:209-210 | advec_mom_kernel | Outermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.55 | 7.40 | 1 | 0.00 | 23.79 | NA | 9.25 | 9.25 | 9.25 | 2.03 | 1.25 |
○Loop 706 | exec | update_halo_kernel.f90-pp.f90:745-746 | __nv_update_halo_kernel_module_update_halo_kernel__F1L93_1_ | Innermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.00 | 1.00 | 1 | 0.00 | 25.00 | NA | 1.00 | 1.00 | 1.00 | 0.25 | 1.00 |
○Loop 587 | exec | flux_calc_kernel.f90-pp.f90:54-56,flux_calc_kernel.f90-pp.f90:61-62 | __nv_flux_calc_kernel_module_flux_calc_kernel__F1L49_1_ | Outermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.39 | 7.00 | 2 | 0.00 | 24.26 | NA | 7.00 | 7.00 | 7.00 | 1.59 | 1.00 |
○Loop 575 | exec | calc_dt_kernel.f90-pp.f90:132-132 | __nv_calc_dt_kernel_module_calc_dt_kernel__F1L89_1_ | Outermost | 0 | 0 | 0.02 | 1.00 | 1.00 | 4.75 | 1.00 | 2 | 0.00 | 24.11 | NA | 8.00 | 8.00 | 8.00 | 1.68 | 8.00 |