| Function: advancePosition._omp_fn.0 | Module: exec | Source: timestep.c:85-94 | Coverage: 0.76% |
|---|
| Function: advancePosition._omp_fn.0 | Module: exec | Source: timestep.c:85-94 | Coverage: 0.76% |
|---|
/home/hbollore/qaas-runs/170-265-5545/intel/CoMD/build/CoMD/CoMD/src-openmp/timestep.c: 85 - 94 |
-------------------------------------------------------------------------------- |
85: #pragma omp parallel for |
86: for (int iBox=0; iBox<nBoxes; iBox++) |
87: { |
88: for (int iOff=MAXATOMS*iBox,ii=0; ii<s->boxes->nAtoms[iBox]; ii++,iOff++) |
89: { |
90: int iSpecies = s->atoms->iSpecies[iOff]; |
91: real_t invMass = 1.0/s->species[iSpecies].mass; |
92: s->atoms->r[iOff][0] += dt*s->atoms->p[iOff][0]*invMass; |
93: s->atoms->r[iOff][1] += dt*s->atoms->p[iOff][1]*invMass; |
94: s->atoms->r[iOff][2] += dt*s->atoms->p[iOff][2]*invMass; |
0x40c740 STP X29, X30, [SP, #-48]! |
0x40c744 ADD X29, SP, #0 |
0x40c748 STR X21, [SP, #32] |
0x40c74c LDR W21, [X0, #16] |
0x40c750 STP X19, X20, [SP, #16] |
0x40c754 ORR X20, XZR, X0 |
0x40c758 BL 4024a0 |
0x40c75c ORR W19, WZR, W0 |
0x40c760 BL 4023f0 |
0x40c764 SDIV W1, W21, W19 |
0x40c768 ORR W14, WZR, W0 |
0x40c76c MSUB W2, W1, W19, W21 |
0x40c770 CMP W0, W2 |
0x40c774 B.LT 40c930 |
(115) 0x40c778 MADD W3, W1, W14, W2 |
(115) 0x40c77c ADD W16, W1, W3 |
(115) 0x40c780 CMP W3, W16 |
(115) 0x40c784 B.GE 40c920 |
(113) 0x40c788 LDR X17, [X20] |
(113) 0x40c78c UBFM W15, W3, #26, #25 |
(113) 0x40c790 MOVZ W0, #24 |
(113) 0x40c794 FMOV D4, #1.0000000 |
(113) 0x40c798 SBFM X14, X3, #0, #31 |
(113) 0x40c79c LDR D0, [X20, #8] |
(113) 0x40c7a0 SMADDL X15, W15, W0, XZR |
(113) 0x40c7a4 LDR X4, [X17, #24] |
(113) 0x40c7a8 LDR X18, [X4, #120] |
(113) 0x40c7ac LDR W5, [X18, X14,LSL #2] |
(113) 0x40c7b0 CMP W5, #0 |
(113) 0x40c7b4 B.LE 40c910 |
(113) 0x40c7b8 LDP X10, X13, [X17, #32] |
(113) 0x40c7bc SUB W9, W5, #1 |
(113) 0x40c7c0 UBFM X7, X14, #56, #55 |
(113) 0x40c7c4 ADD X8, X9, X14,LSL #6 |
(113) 0x40c7c8 ORR X0, XZR, X15 |
(113) 0x40c7cc LDP X6, X30, [X10, #16] |
(113) 0x40c7d0 LDR X20, [X10, #32] |
(113) 0x40c7d4 ADD X11, X6, #4 |
(113) 0x40c7d8 ADD X3, X6, X7 |
(113) 0x40c7dc ADD X21, X11, X8,LSL #2 |
(113) 0x40c7e0 ADD X19, X30, #8 |
(113) 0x40c7e4 ADD X2, X30, #16 |
(113) 0x40c7e8 SUB X1, X21, X3 |
(113) 0x40c7ec ADD X12, X20, #8 |
(113) 0x40c7f0 ADD X4, X20, #16 |
(113) 0x40c7f4 TBZ W1, #2, 40c860 |
0x40c7f8 LDRSW X5, [X6, X7] |
0x40c7fc ADD X3, X3, #4 |
0x40c800 ADD X0, X15, #24 |
0x40c804 LDR D3, [X20, X15] |
0x40c808 LDR D2, [X30, X15] |
0x40c80c ADD X9, X13, X5,LSL #4 |
0x40c810 LDR D1, [X9, #8] |
0x40c814 FMUL D5, D0, D3 |
0x40c818 FDIV D6, D4, D1 |
0x40c81c FMADD D7, D6, D5, D2 |
0x40c820 STR D7, [X30, X15] |
0x40c824 LDR D16, [X12, X15] |
0x40c828 LDR D17, [X19, X15] |
0x40c82c FMUL D18, D0, D16 |
0x40c830 FMADD D19, D6, D18, D17 |
0x40c834 STR D19, [X19, X15] |
0x40c838 LDR D20, [X4, X15] |
0x40c83c LDR D21, [X2, X15] |
0x40c840 FMUL D22, D0, D20 |
0x40c844 FMADD D23, D6, D22, D21 |
0x40c848 STR D23, [X2, X15] |
0x40c84c CMP X3, X21 |
0x40c850 B.EQ 40c910 |
0x40c854 HINT #0 |
0x40c858 HINT #0 |
0x40c85c HINT #0 |
(114) 0x40c860 ORR X8, XZR, X3 |
(114) 0x40c864 LDR D24, [X20, X0] |
(114) 0x40c868 ADD X10, X0, #24 |
(114) 0x40c86c LDRSW X7, [X8], #4 |
(114) 0x40c870 LDR D25, [X30, X0] |
(114) 0x40c874 FMUL D26, D0, D24 |
(114) 0x40c878 LDRSW X6, [X3, #4] |
(114) 0x40c87c ADD X11, X13, X7,LSL #4 |
(114) 0x40c880 ADD X3, X8, #4 |
(114) 0x40c884 LDR D27, [X11, #8] |
(114) 0x40c888 ADD X1, X13, X6,LSL #4 |
(114) 0x40c88c FDIV D28, D4, D27 |
(114) 0x40c890 FMADD D29, D28, D26, D25 |
(114) 0x40c894 STR D29, [X30, X0] |
(114) 0x40c898 LDR D30, [X12, X0] |
(114) 0x40c89c LDR D31, [X19, X0] |
(114) 0x40c8a0 FMUL D3, D0, D30 |
(114) 0x40c8a4 FMADD D2, D28, D3, D31 |
(114) 0x40c8a8 STR D2, [X19, X0] |
(114) 0x40c8ac LDR D5, [X4, X0] |
(114) 0x40c8b0 LDR D1, [X2, X0] |
(114) 0x40c8b4 FMUL D6, D0, D5 |
(114) 0x40c8b8 FMADD D7, D28, D6, D1 |
(114) 0x40c8bc STR D7, [X2, X0] |
(114) 0x40c8c0 ADD X0, X0, #48 |
(114) 0x40c8c4 LDR D19, [X1, #8] |
(114) 0x40c8c8 LDR D16, [X20, X10] |
(114) 0x40c8cc LDR D17, [X30, X10] |
(114) 0x40c8d0 FDIV D20, D4, D19 |
(114) 0x40c8d4 FMUL D18, D0, D16 |
(114) 0x40c8d8 FMADD D21, D20, D18, D17 |
(114) 0x40c8dc STR D21, [X30, X10] |
(114) 0x40c8e0 LDR D22, [X12, X10] |
(114) 0x40c8e4 LDR D23, [X19, X10] |
(114) 0x40c8e8 FMUL D24, D0, D22 |
(114) 0x40c8ec FMADD D25, D20, D24, D23 |
(114) 0x40c8f0 STR D25, [X19, X10] |
(114) 0x40c8f4 LDR D26, [X4, X10] |
(114) 0x40c8f8 LDR D27, [X2, X10] |
(114) 0x40c8fc FMUL D28, D0, D26 |
(114) 0x40c900 FMADD D29, D20, D28, D27 |
(114) 0x40c904 STR D29, [X2, X10] |
(114) 0x40c908 CMP X3, X21 |
(114) 0x40c90c B.NE 40c860 |
(113) 0x40c910 ADD X14, X14, #1 |
(113) 0x40c914 ADD X15, X15, #1536 |
(113) 0x40c918 CMP W16, W14 |
(113) 0x40c91c B.GT 40c7ac |
(115) 0x40c920 LDP X19, X20, [SP, #16] |
(115) 0x40c924 LDR X21, [SP, #32] |
(115) 0x40c928 LDP X29, X30, [SP], #48 |
(115) 0x40c92c RET |
(115) 0x40c930 ADD W1, W1, #1 |
(115) 0x40c934 MOVZ W2, #0 |
(115) 0x40c938 B 40c778 |
0x40c93c HINT #0 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►97.93+ | __kmp_GOMP_microtask_wrapper(i[...] | libomp.so | |
| ○ | __kmp_invoke_microtask | libomp.so | |
| ►2.07+ | GOMP_parallel | libomp.so | |
| ○ | timestep | timestep.c:43 | exec |
| ○ | main | CoMD.c:125 | exec |
| ○ | __libc_start_main | libc-2.31.so | |
| ○ | _start | CoMD.c:266 | exec |
| Path / |
| Source file and lines | timestep.c:85-94 |
| Module | exec |
| nb instructions | 41 |
| loop length | 164 |
| nb stack references | 0 |
| front end | 4.63 cycles |
| | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| uops | 2.00 | 2.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.50 | 2.50 | 2.50 | 2.50 | 5.00 | 5.00 | 5.00 | 1.50 | 1.50 |
| cycles | 2.00 | 2.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.50 | 2.50 | 2.50 | 2.50 | 5.00 | 5.00 | 5.00 | 1.50 | 1.50 |
| Cycles executing div or sqrt instructions | 2.00-1.00 |
| Front-end | 4.63 |
| Overall L1 | 5.00 |
| all | 0% |
| load | 0% |
| store | 0% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | 0% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | 0% |
| other | 0% |
| Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| STP X29, X30, [SP, #-48]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
| ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| STR X21, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
| LDR W21, [X0, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
| STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
| ORR X20, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| BL 4024a0 <@plt_start@+0x280> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| ORR W19, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| BL 4023f0 <@plt_start@+0x1d0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| SDIV W1, W21, W19 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-12 | 1-0.50 |
| ORR W14, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| MSUB W2, W1, W19, W21 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
| CMP W0, W2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
| B.LT 40c930 <advancePosition._omp_fn.0+0x1f0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| LDRSW X5, [X6, X7] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
| ADD X3, X3, #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| ADD X0, X15, #24 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| LDR D3, [X20, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| LDR D2, [X30, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| ADD X9, X13, X5,LSL #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| LDR D1, [X9, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| FMUL D5, D0, D3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 3 | 0.25 |
| FDIV D6, D4, D1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 7-15 | 1-0.50 |
| FMADD D7, D6, D5, D2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 4 | 0.25 |
| STR D7, [X30, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| LDR D16, [X12, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| LDR D17, [X19, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| FMUL D18, D0, D16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 3 | 0.25 |
| FMADD D19, D6, D18, D17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 4 | 0.25 |
| STR D19, [X19, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| LDR D20, [X4, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| LDR D21, [X2, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| FMUL D22, D0, D20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 3 | 0.25 |
| FMADD D23, D6, D22, D21 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 4 | 0.25 |
| STR D23, [X2, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| CMP X3, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
| B.EQ 40c910 <advancePosition._omp_fn.0+0x1d0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| HINT #0 | ||||||||||||||||||
| HINT #0 | ||||||||||||||||||
| HINT #0 | ||||||||||||||||||
| HINT #0 |
| Source file and lines | timestep.c:85-94 |
| Module | exec |
| nb instructions | 41 |
| loop length | 164 |
| nb stack references | 0 |
| front end | 4.63 cycles |
| | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| uops | 2.00 | 2.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.50 | 2.50 | 2.50 | 2.50 | 5.00 | 5.00 | 5.00 | 1.50 | 1.50 |
| cycles | 2.00 | 2.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.50 | 2.50 | 2.50 | 2.50 | 5.00 | 5.00 | 5.00 | 1.50 | 1.50 |
| Cycles executing div or sqrt instructions | 2.00-1.00 |
| Front-end | 4.63 |
| Overall L1 | 5.00 |
| all | 0% |
| load | 0% |
| store | 0% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | 0% |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | 0% |
| other | 0% |
| Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| STP X29, X30, [SP, #-48]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
| ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| STR X21, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
| LDR W21, [X0, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
| STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
| ORR X20, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| BL 4024a0 <@plt_start@+0x280> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| ORR W19, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| BL 4023f0 <@plt_start@+0x1d0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| SDIV W1, W21, W19 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-12 | 1-0.50 |
| ORR W14, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| MSUB W2, W1, W19, W21 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
| CMP W0, W2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
| B.LT 40c930 <advancePosition._omp_fn.0+0x1f0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| LDRSW X5, [X6, X7] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
| ADD X3, X3, #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| ADD X0, X15, #24 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| LDR D3, [X20, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| LDR D2, [X30, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| ADD X9, X13, X5,LSL #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
| LDR D1, [X9, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| FMUL D5, D0, D3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 3 | 0.25 |
| FDIV D6, D4, D1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 7-15 | 1-0.50 |
| FMADD D7, D6, D5, D2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 4 | 0.25 |
| STR D7, [X30, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| LDR D16, [X12, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| LDR D17, [X19, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| FMUL D18, D0, D16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 3 | 0.25 |
| FMADD D19, D6, D18, D17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 4 | 0.25 |
| STR D19, [X19, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| LDR D20, [X4, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| LDR D21, [X2, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
| FMUL D22, D0, D20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 3 | 0.25 |
| FMADD D23, D6, D22, D21 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 4 | 0.25 |
| STR D23, [X2, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
| CMP X3, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
| B.EQ 40c910 <advancePosition._omp_fn.0+0x1d0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
| HINT #0 | ||||||||||||||||||
| HINT #0 | ||||||||||||||||||
| HINT #0 | ||||||||||||||||||
| HINT #0 |
| Name | Coverage (%) | Time (s) |
|---|---|---|
| ▼advancePosition._omp_fn.0– | 0.76 | 0.13 |
| ▼Loop 113 - timestep.c:85-94 - exec– | 0 | 0 |
| ○Loop 114 - timestep.c:88-94 - exec | 0.71 | 0.12 |
| ○Loop 115 - timestep.c:85-86 - exec | 0 | 0 |
