| Function: k_means(int, point_t*, point_t*, int*, int, int) [clone ._omp_fn.1] | Module: kmeans-gcc-Ofast | Source: main.cpp:138-143 | Coverage (incl. loops): 0.02% | (excl. loops): 0.00% |
|---|
| Function: k_means(int, point_t*, point_t*, int*, int, int) [clone ._omp_fn.1] | Module: kmeans-gcc-Ofast | Source: main.cpp:138-143 | Coverage (incl. loops): 0.02% | (excl. loops): 0.00% |
|---|
/home/fmusial/KMEANS_Benchmarks/kmeans/main.cpp: 138 - 143 |
-------------------------------------------------------------------------------- |
138: #pragma omp parallel for reduction(+:sum_x[:k], sum_y[:k], count[:k]) |
139: for (int i = 0; i < n; ++i) { |
140: int cid = assignment[i]; |
141: count[cid] += 1; |
142: sum_x[cid] += points[i].x; |
143: sum_y[cid] += points[i].y; |
0x401e60 STP X29, X30, [SP, #-112]! |
0x401e64 ADD X29, SP, #0 |
0x401e68 CNTW X2, ALL |
0x401e6c STP X25, X26, [SP, #64] |
0x401e70 ORR X25, XZR, X0 |
0x401e74 SUB X0, X2, #1 |
0x401e78 STP X19, X20, [SP, #16] |
0x401e7c STP X21, X22, [SP, #32] |
0x401e80 STP X23, X24, [SP, #48] |
0x401e84 STP X27, X28, [SP, #80] |
0x401e88 LDP X1, X26, [X25] |
0x401e8c LDR X20, [X25, #80] |
0x401e90 STR X1, [X29, #96] |
0x401e94 LDP X24, X22, [X25, #64] |
0x401e98 UBFM X1, X24, #61, #60 |
0x401e9c SUB X3, X24, #13 |
0x401ea0 ADD X1, X1, #23 |
0x401ea4 CMP X24, X0 |
0x401ea8 AND X1, X1, #0xfffffffffffffff0 |
0x401eac CCMN X3, #15, #2, #2 |
0x401eb0 LDR W3, [X25, #88] |
0x401eb4 SUB SP, SP, X1,UXTX |
0x401eb8 ADD X23, SP, #0 |
0x401ebc B.HI 4023d4 |
0x401ec0 ADDVL X5, SP, #1 |
0x401ec4 SUB X0, X24, X0 |
0x401ec8 PTRUE P7.B, ALL |
0x401ecc MOVN X1, #0 |
0x401ed0 ADD X4, SP, #8 |
0x401ed4 DUP Z31.D, #0 |
0x401ed8 ADD X5, X5, #8 |
0x401edc HINT #0 |
(21) 0x401ee0 ST1D {Z31.D}, P7, [X4, X1,LSL #3] |
(21) 0x401ee4 ORR X6, XZR, X1 |
(21) 0x401ee8 ST1D {Z31.D}, P7, [X5, X1,LSL #3] |
(21) 0x401eec ADD X1, X1, X2 |
(21) 0x401ef0 CMP X0, X1 |
(21) 0x401ef4 B.HI 401ee0 |
0x401ef8 ADDPL X2, X6, #2 |
0x401efc ADD X2, X2, #1 |
0x401f00 UBFM X0, X2, #61, #60 |
0x401f04 CMP X24, X1 |
0x401f08 B.EQ 401f30 |
0x401f0c SUB X1, X0, X1,LSL #3 |
0x401f10 SUB X1, X1, #8 |
0x401f14 ADD X1, X23, X1 |
0x401f18 HINT #0 |
0x401f1c HINT #0 |
(22) 0x401f20 STR XZR, [X1, X2,LSL #3] |
(22) 0x401f24 ADD X2, X2, #1 |
(22) 0x401f28 CMP X24, X2 |
(22) 0x401f2c B.CS 401f20 |
0x401f30 UBFM X1, X22, #61, #60 |
0x401f34 CNTW X2, ALL |
0x401f38 ADD X1, X1, #23 |
0x401f3c SUB X0, X2, #1 |
0x401f40 AND X1, X1, #0xfffffffffffffff0 |
0x401f44 CMP X22, X0 |
0x401f48 SUB X4, X22, #13 |
0x401f4c SUB SP, SP, X1,UXTX |
0x401f50 CCMN X4, #15, #2, #2 |
0x401f54 ADD X21, SP, #0 |
0x401f58 B.HI 4023f4 |
0x401f5c ADDVL X5, SP, #1 |
0x401f60 SUB X0, X22, X0 |
0x401f64 PTRUE P7.B, ALL |
0x401f68 MOVN X1, #0 |
0x401f6c ADD X4, SP, #8 |
0x401f70 DUP Z30.D, #0 |
0x401f74 ADD X5, X5, #8 |
0x401f78 HINT #0 |
0x401f7c HINT #0 |
(19) 0x401f80 ST1D {Z30.D}, P7, [X4, X1,LSL #3] |
(19) 0x401f84 ORR X6, XZR, X1 |
(19) 0x401f88 ST1D {Z30.D}, P7, [X5, X1,LSL #3] |
(19) 0x401f8c ADD X1, X1, X2 |
(19) 0x401f90 CMP X0, X1 |
(19) 0x401f94 B.HI 401f80 |
0x401f98 ADDPL X2, X6, #2 |
0x401f9c ADD X2, X2, #1 |
0x401fa0 UBFM X0, X2, #61, #60 |
0x401fa4 CMP X22, X1 |
0x401fa8 B.EQ 401fd0 |
0x401fac SUB X1, X0, X1,LSL #3 |
0x401fb0 SUB X1, X1, #8 |
0x401fb4 ADD X1, X21, X1 |
0x401fb8 HINT #0 |
0x401fbc HINT #0 |
(20) 0x401fc0 STR XZR, [X1, X2,LSL #3] |
(20) 0x401fc4 ADD X2, X2, #1 |
(20) 0x401fc8 CMP X22, X2 |
(20) 0x401fcc B.CS 401fc0 |
0x401fd0 ADD X28, X20, #1 |
0x401fd4 CNTD X1, ALL |
0x401fd8 UBFM X0, X28, #62, #61 |
0x401fdc SUB X1, X1, #1 |
0x401fe0 ADD X0, X0, #15 |
0x401fe4 CMP X20, X1 |
0x401fe8 AND X0, X0, #0xfffffffffffffff0 |
0x401fec SUB X1, X20, #16 |
0x401ff0 SUB SP, SP, X0,UXTX |
0x401ff4 CCMN X1, #18, #2, #2 |
0x401ff8 ADD X27, SP, #0 |
0x401ffc B.HI 4023b0 |
0x402000 CNTH X2, ALL |
0x402004 SUB X0, X2, #1 |
0x402008 CMP X20, X0 |
0x40200c B.CC 402434 |
0x402010 ADDVL X6, SP, #1 |
0x402014 SUB X0, X20, X0 |
0x402018 PTRUE P7.B, ALL |
0x40201c MOVN X1, #0 |
0x402020 ADD X4, SP, #4 |
0x402024 DUP Z29.B, #0 |
0x402028 ADD X6, X6, #4 |
(18) 0x40202c ST1W {Z29.S}, P7, [X4, X1,LSL #2] |
(18) 0x402030 ORR X5, XZR, X1 |
(18) 0x402034 ST1W {Z29.S}, P7, [X6, X1,LSL #2] |
(18) 0x402038 ADD X1, X1, X2 |
(18) 0x40203c CMP X0, X1 |
(18) 0x402040 B.HI 40202c |
0x402044 ADDPL X2, X5, #4 |
0x402048 ADD X2, X2, #1 |
0x40204c ADD X4, X27, X2,LSL #2 |
0x402050 CMP X20, X1 |
0x402054 B.EQ 4020d0 |
0x402058 CNTD X5, ALL |
0x40205c SUB X0, X20, X2 |
0x402060 ADD X1, X5, #4 |
0x402064 SUB X8, X28, X2 |
0x402068 CMP X0, X1 |
0x40206c B.CC 4020b4 |
0x402070 ADD X0, X2, #1 |
0x402074 SUB X7, X8, X5 |
0x402078 PTRUE P7.B, ALL |
0x40207c ADD X0, X27, X0,LSL #2 |
0x402080 MOVN X1, #0 |
0x402084 DUP Z28.B, #0 |
(17) 0x402088 ORR X6, XZR, X1 |
(17) 0x40208c ST1W {Z28.D}, P7, [X0, X1,LSL #2] |
(17) 0x402090 ADD X1, X1, X5 |
(17) 0x402094 CMP X7, X1 |
(17) 0x402098 B.HI 402088 |
0x40209c ADDPL X0, X6, #1 |
0x4020a0 ADD X0, X0, #1 |
0x4020a4 ADD X4, X4, X0,LSL #2 |
0x4020a8 ADD X2, X2, X0 |
0x4020ac CMP X8, X0 |
0x4020b0 B.EQ 4020d0 |
0x4020b4 SUB X0, X4, X2,LSL #2 |
0x4020b8 HINT #0 |
0x4020bc HINT #0 |
(16) 0x4020c0 STR WZR, [X0, X2,LSL #2] |
(16) 0x4020c4 ADD X2, X2, #1 |
(16) 0x4020c8 CMP X20, X2 |
(16) 0x4020cc B.CS 4020c0 |
0x4020d0 STR W3, [X29, #104] |
0x4020d4 BL 401930 |
0x4020d8 ORR W19, WZR, W0 |
0x4020dc BL 401880 |
0x4020e0 LDR W3, [X29, #104] |
0x4020e4 ORR W1, WZR, W0 |
0x4020e8 SDIV W5, W3, W19 |
0x4020ec MSUB W0, W5, W19, W3 |
0x4020f0 CMP W1, W0 |
0x4020f4 B.LT 4023a4 |
(10) 0x4020f8 MADD W1, W5, W1, W0 |
(10) 0x4020fc ADD W5, W5, W1 |
(10) 0x402100 CMP W1, W5 |
(10) 0x402104 B.GE 40215c |
(10) 0x402108 LDR X2, [X29, #96] |
(10) 0x40210c SBFM X0, X1, #0, #31 |
(10) 0x402110 ADD X1, X2, W1,SXTW #4 |
(10) 0x402114 HINT #0 |
(10) 0x402118 HINT #0 |
(10) 0x40211c HINT #0 |
(15) 0x402120 LDR W2, [X26, X0,LSL #2] |
(15) 0x402124 ADD X0, X0, #1 |
(15) 0x402128 LDP D24, D26, [X1], #16 |
(15) 0x40212c LDR D25, [X23, X2,SXTW #3] |
(15) 0x402130 SBFM X4, X2, #62, #31 |
(15) 0x402134 LDR D27, [X21, X2,SXTW #3] |
(15) 0x402138 LDR W3, [X27, X4] |
(15) 0x40213c FADD D24, D25, D24 |
(15) 0x402140 FADD D26, D27, D26 |
(15) 0x402144 ADD W3, W3, #1 |
(15) 0x402148 STR W3, [X27, X4] |
(15) 0x40214c STR D24, [X23, X2,SXTW #3] |
(15) 0x402150 STR D26, [X21, X2,SXTW #3] |
(15) 0x402154 CMP W5, W0 |
(15) 0x402158 B.GT 402120 |
(10) 0x40215c LDR X2, [X25, #24] |
(10) 0x402160 LDR X26, [X25, #40] |
(10) 0x402164 LDR X19, [X25, #56] |
(10) 0x402168 STR X2, [X29, #104] |
(10) 0x40216c BL 401760 |
(10) 0x402170 CNTD X3, ALL |
(10) 0x402174 LDR X2, [X29, #104] |
(10) 0x402178 ADD X0, X3, #1 |
(10) 0x40217c CMP X24, X0 |
(10) 0x402180 B.CC 402414 |
(10) 0x402184 ADDPL X6, X24, #63 |
(10) 0x402188 MOVN X0, #0 |
(10) 0x40218c PTRUE P7.B, ALL |
(10) 0x402190 ADD X6, X6, #1 |
(10) 0x402194 ADD X4, X23, #8 |
(10) 0x402198 ADD X1, X26, #8 |
(10) 0x40219c HINT #0 |
(14) 0x4021a0 LD1D {Z23.D}, P7/Z, [X1, X0,LSL #3] |
(14) 0x4021a4 LD1D {Z22.D}, P7/Z, [X4, X0,LSL #3] |
(14) 0x4021a8 ORR X5, XZR, X0 |
(14) 0x4021ac FADD Z22.D, Z23.D, Z22.D |
(14) 0x4021b0 ST1D {Z22.D}, P7, [X1, X0,LSL #3] |
(14) 0x4021b4 ADD X0, X0, X3 |
(14) 0x4021b8 CMP X6, X0 |
(14) 0x4021bc B.HI 4021a0 |
(10) 0x4021c0 ADDPL X1, X5, #1 |
(10) 0x4021c4 ADD X1, X1, #1 |
(10) 0x4021c8 ADD X23, X23, X1,LSL #3 |
(10) 0x4021cc ADD X26, X26, X1,LSL #3 |
(10) 0x4021d0 CMP X24, X0 |
(10) 0x4021d4 B.EQ 4021fc |
(10) 0x4021d8 SUB X0, X26, X1,LSL #3 |
(10) 0x4021dc SUB X23, X23, X1,LSL #3 |
(7) 0x4021e0 LDR D21, [X0, X1,LSL #3] |
(7) 0x4021e4 LDR D20, [X23, X1,LSL #3] |
(7) 0x4021e8 FADD D20, D21, D20 |
(7) 0x4021ec STR D20, [X0, X1,LSL #3] |
(7) 0x4021f0 ADD X1, X1, #1 |
(7) 0x4021f4 CMP X24, X1 |
(7) 0x4021f8 B.CS 4021e0 |
(10) 0x4021fc CNTD X3, ALL |
(10) 0x402200 ADD X0, X3, #1 |
(10) 0x402204 CMP X22, X0 |
(10) 0x402208 B.CC 40241c |
(10) 0x40220c ADDPL X6, X22, #63 |
(10) 0x402210 MOVN X0, #0 |
(10) 0x402214 PTRUE P7.B, ALL |
(10) 0x402218 ADD X6, X6, #1 |
(10) 0x40221c ADD X4, X21, #8 |
(10) 0x402220 ADD X1, X19, #8 |
(13) 0x402224 LD1D {Z19.D}, P7/Z, [X1, X0,LSL #3] |
(13) 0x402228 LD1D {Z18.D}, P7/Z, [X4, X0,LSL #3] |
(13) 0x40222c ORR X5, XZR, X0 |
(13) 0x402230 FADD Z18.D, Z19.D, Z18.D |
(13) 0x402234 ST1D {Z18.D}, P7, [X1, X0,LSL #3] |
(13) 0x402238 ADD X0, X0, X3 |
(13) 0x40223c CMP X6, X0 |
(13) 0x402240 B.HI 402224 |
(10) 0x402244 ADDPL X1, X5, #1 |
(10) 0x402248 ADD X1, X1, #1 |
(10) 0x40224c ADD X21, X21, X1,LSL #3 |
(10) 0x402250 ADD X19, X19, X1,LSL #3 |
(10) 0x402254 CMP X22, X0 |
(10) 0x402258 B.EQ 402280 |
(10) 0x40225c SUB X0, X19, X1,LSL #3 |
(10) 0x402260 SUB X21, X21, X1,LSL #3 |
(8) 0x402264 LDR D17, [X0, X1,LSL #3] |
(8) 0x402268 LDR D16, [X21, X1,LSL #3] |
(8) 0x40226c FADD D16, D17, D16 |
(8) 0x402270 STR D16, [X0, X1,LSL #3] |
(8) 0x402274 ADD X1, X1, #1 |
(8) 0x402278 CMP X22, X1 |
(8) 0x40227c B.CS 402264 |
(10) 0x402280 CNTW X3, ALL |
(10) 0x402284 ADD X0, X3, #3 |
(10) 0x402288 CMP X20, X0 |
(10) 0x40228c B.CC 402424 |
(10) 0x402290 ADDPL X6, X20, #62 |
(10) 0x402294 MOVN X0, #0 |
(10) 0x402298 PTRUE P7.B, ALL |
(10) 0x40229c ADD X6, X6, #1 |
(10) 0x4022a0 ADD X4, X27, #4 |
(10) 0x4022a4 ADD X1, X2, #4 |
(12) 0x4022a8 LD1W {Z7.S}, P7/Z, [X1, X0,LSL #2] |
(12) 0x4022ac LD1W {Z6.S}, P7/Z, [X4, X0,LSL #2] |
(12) 0x4022b0 ORR X5, XZR, X0 |
(12) 0x4022b4 ADD Z6.S, Z7.S, Z6.S |
(12) 0x4022b8 ST1W {Z6.S}, P7, [X1, X0,LSL #2] |
(12) 0x4022bc ADD X0, X0, X3 |
(12) 0x4022c0 CMP X0, X6 |
(12) 0x4022c4 B.CC 4022a8 |
(10) 0x4022c8 ADDPL X1, X5, #2 |
(10) 0x4022cc ADD X1, X1, #1 |
(10) 0x4022d0 ADD X5, X27, X1,LSL #2 |
(10) 0x4022d4 ADD X3, X2, X1,LSL #2 |
(10) 0x4022d8 CMP X20, X0 |
(10) 0x4022dc B.EQ 402380 |
(10) 0x4022e0 CNTD X6, ALL |
(10) 0x4022e4 SUB X0, X20, X1 |
(10) 0x4022e8 ADD X4, X6, #1 |
(10) 0x4022ec SUB X28, X28, X1 |
(10) 0x4022f0 CMP X0, X4 |
(10) 0x4022f4 B.CC 40235c |
(10) 0x4022f8 UBFM X4, X1, #62, #61 |
(10) 0x4022fc SUB X8, X28, X6 |
(10) 0x402300 PTRUE P7.B, ALL |
(10) 0x402304 ADD X4, X4, #4 |
(10) 0x402308 MOVN X0, #0 |
(10) 0x40230c ADD X2, X2, X4 |
(10) 0x402310 ADD X4, X27, X4 |
(10) 0x402314 HINT #0 |
(10) 0x402318 HINT #0 |
(10) 0x40231c HINT #0 |
(11) 0x402320 LD1W {Z5.D}, P7/Z, [X2, X0,LSL #2] |
(11) 0x402324 LD1W {Z4.D}, P7/Z, [X4, X0,LSL #2] |
(11) 0x402328 ORR X7, XZR, X0 |
(11) 0x40232c ADD Z4.S, Z5.S, Z4.S |
(11) 0x402330 ST1W {Z4.D}, P7, [X2, X0,LSL #2] |
(11) 0x402334 ADD X0, X0, X6 |
(11) 0x402338 CMP X8, X0 |
(11) 0x40233c B.HI 402320 |
(10) 0x402340 ADDPL X0, X7, #1 |
(10) 0x402344 ADD X0, X0, #1 |
(10) 0x402348 ADD X5, X5, X0,LSL #2 |
(10) 0x40234c ADD X1, X1, X0 |
(10) 0x402350 ADD X3, X3, X0,LSL #2 |
(10) 0x402354 CMP X28, X0 |
(10) 0x402358 B.EQ 402380 |
(10) 0x40235c SUB X2, X3, X1,LSL #2 |
(10) 0x402360 SUB X4, X5, X1,LSL #2 |
(9) 0x402364 LDR W0, [X2, X1,LSL #2] |
(9) 0x402368 LDR W3, [X4, X1,LSL #2] |
(9) 0x40236c ADD W0, W0, W3 |
(9) 0x402370 STR W0, [X2, X1,LSL #2] |
(9) 0x402374 ADD X1, X1, #1 |
(9) 0x402378 CMP X20, X1 |
(9) 0x40237c B.CS 402364 |
(10) 0x402380 BL 4017c0 |
(10) 0x402384 ADD SP, X29, #0 |
(10) 0x402388 LDP X19, X20, [SP, #16] |
(10) 0x40238c LDP X21, X22, [SP, #32] |
(10) 0x402390 LDP X23, X24, [SP, #48] |
(10) 0x402394 LDP X25, X26, [SP, #64] |
(10) 0x402398 LDP X27, X28, [SP, #80] |
(10) 0x40239c LDP X29, X30, [SP], #112 |
(10) 0x4023a0 RET |
(10) 0x4023a4 ADD W5, W5, #1 |
(10) 0x4023a8 MOVZ W0, #0 |
(10) 0x4023ac B 4020f8 |
0x4023b0 MOVZ X0, #0 |
0x4023b4 HINT #0 |
0x4023b8 HINT #0 |
0x4023bc HINT #0 |
(6) 0x4023c0 STR WZR, [X27, X0,LSL #2] |
(6) 0x4023c4 ADD X0, X0, #1 |
(6) 0x4023c8 CMP X20, X0 |
(6) 0x4023cc B.CS 4023c0 |
0x4023d0 B 4020d0 |
0x4023d4 MOVZ X0, #0 |
0x4023d8 HINT #0 |
0x4023dc HINT #0 |
(4) 0x4023e0 STR XZR, [X23, X0,LSL #3] |
(4) 0x4023e4 ADD X0, X0, #1 |
(4) 0x4023e8 CMP X24, X0 |
(4) 0x4023ec B.CS 4023e0 |
0x4023f0 B 401f30 |
0x4023f4 MOVZ X0, #0 |
0x4023f8 HINT #0 |
0x4023fc HINT #0 |
(5) 0x402400 STR XZR, [X21, X0,LSL #3] |
(5) 0x402404 ADD X0, X0, #1 |
(5) 0x402408 CMP X22, X0 |
(5) 0x40240c B.CS 402400 |
0x402410 B 401fd0 |
(10) 0x402414 MOVZ X1, #0 |
(10) 0x402418 B 4021d8 |
(10) 0x40241c MOVZ X1, #0 |
(10) 0x402420 B 40225c |
(10) 0x402424 MOVZ X1, #0 |
(10) 0x402428 ORR X3, XZR, X2 |
(10) 0x40242c ORR X5, XZR, X27 |
(10) 0x402430 B 4022e0 |
0x402434 MOVZ X2, #0 |
0x402438 ADD X4, SP, #0 |
0x40243c B 402058 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►100.00+ | GOMP_parallel | libgomp.h:980 | libgomp.so.1.0.0 |
| ○ | k_means(int, point_t*, point_t[...] | main.cpp:146 | kmeans-gcc-Ofast |
| ○ | main | main.cpp:188 | kmeans-gcc-Ofast |
| ○ | __libc_init_first | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | new_allocator.h:104 | kmeans-gcc-Ofast |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►100.00+ | gomp_thread_start | team.c:130 | libgomp.so.1.0.0 |
| ○ | pthread_condattr_setpshared | libc.so.6 | |
| ○ | __clone | libc.so.6 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►62.50+ | gomp_thread_start | team.c:130 | libgomp.so.1.0.0 |
| ○ | pthread_condattr_setpshared | libc.so.6 | |
| ○ | __clone | libc.so.6 | |
| ►37.50+ | GOMP_parallel | libgomp.h:980 | libgomp.so.1.0.0 |
| ○ | k_means(int, point_t*, point_t[...] | main.cpp:146 | kmeans-gcc-Ofast |
| ○ | main | main.cpp:188 | kmeans-gcc-Ofast |
| ○ | __libc_init_first | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | new_allocator.h:104 | kmeans-gcc-Ofast |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►95.24+ | gomp_thread_start | team.c:130 | libgomp.so.1.0.0 |
| ○ | pthread_condattr_setpshared | libc.so.6 | |
| ○ | __clone | libc.so.6 | |
| ►4.76+ | GOMP_parallel | libgomp.h:980 | libgomp.so.1.0.0 |
| ○ | k_means(int, point_t*, point_t[...] | main.cpp:146 | kmeans-gcc-Ofast |
| ○ | main | main.cpp:188 | kmeans-gcc-Ofast |
| ○ | __libc_init_first | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | new_allocator.h:104 | kmeans-gcc-Ofast |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►92.21+ | gomp_thread_start | team.c:130 | libgomp.so.1.0.0 |
| ○ | pthread_condattr_setpshared | libc.so.6 | |
| ○ | __clone | libc.so.6 | |
| ►7.79+ | GOMP_parallel | libgomp.h:980 | libgomp.so.1.0.0 |
| ○ | k_means(int, point_t*, point_t[...] | main.cpp:146 | kmeans-gcc-Ofast |
| ○ | main | main.cpp:188 | kmeans-gcc-Ofast |
| ○ | __libc_init_first | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | new_allocator.h:104 | kmeans-gcc-Ofast |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►95.67+ | gomp_thread_start | team.c:130 | libgomp.so.1.0.0 |
| ○ | pthread_condattr_setpshared | libc.so.6 | |
| ○ | __clone | libc.so.6 | |
| ►4.33+ | GOMP_parallel | libgomp.h:980 | libgomp.so.1.0.0 |
| ○ | k_means(int, point_t*, point_t[...] | main.cpp:146 | kmeans-gcc-Ofast |
| ○ | main | main.cpp:188 | kmeans-gcc-Ofast |
| ○ | __libc_init_first | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | new_allocator.h:104 | kmeans-gcc-Ofast |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►98.18+ | gomp_thread_start | team.c:130 | libgomp.so.1.0.0 |
| ○ | pthread_condattr_setpshared | libc.so.6 | |
| ○ | __clone | libc.so.6 | |
| ►1.82+ | GOMP_parallel | libgomp.h:980 | libgomp.so.1.0.0 |
| ○ | k_means(int, point_t*, point_t[...] | main.cpp:146 | kmeans-gcc-Ofast |
| ○ | main | main.cpp:188 | kmeans-gcc-Ofast |
| ○ | __libc_init_first | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | new_allocator.h:104 | kmeans-gcc-Ofast |
| min | med | avg | max |
|---|---|---|---|
| Percentile Index | 10 | 20 | 30 | 40 | 50 | 60 | 70 | 80 | 90 | 100 |
|---|---|---|---|---|---|---|---|---|---|---|
| Value |
| min | med | avg | max |
|---|---|---|---|
| Percentile Index | 10 | 20 | 30 | 40 | 50 | 60 | 70 | 80 | 90 | 100 |
|---|---|---|---|---|---|---|---|---|---|---|
| Value |
| Path / |
The code analyzed by CQA in this panel excludes loops and accounts for 0.00% of application time in run run_1_thread.
| Source file and lines | main.cpp:138-143 |
| Module | kmeans-gcc-Ofast |
| nb instructions | 147 |
| nb uops | 131 |
| loop length | 588 |
| used w registers | 6 |
| used x registers | 22 |
| used b registers | 0 |
| used h registers | 0 |
| used s registers | 1 |
| used d registers | 0 |
| used q registers | 0 |
| used v registers | 0 |
| used z registers | 4 |
| nb stack references | 6 |
| micro-operation queue | 16.38 cycles |
| front end | 16.38 cycles |
| P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| uops | 8.00 | 8.00 | 25.25 | 25.25 | 25.25 | 25.25 | 2.00 | 2.00 | 0.00 | 0.00 | 4.33 | 4.33 | 4.33 | 4.00 | 4.00 |
| cycles | 8.00 | 8.00 | 25.25 | 25.25 | 25.25 | 25.25 | 2.00 | 2.00 | 0.00 | 0.00 | 4.33 | 4.33 | 4.33 | 4.00 | 4.00 |
| Cycles executing div or sqrt instructions | 5.00-12.50 |
| Front-end | 16.38 |
| Dispatch | 25.25 |
| DIV/SQRT | 5.00-12.50 |
| Overall L1 | 25.25 |
| all | 0% |
| load | 0% |
| store | 0% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | 0% |
| fma | 0% |
| div/sqrt | 0% |
| other | 0% |
| all | 28% |
| load | 30% |
| store | 42% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | 25% |
| fma | 12% |
| div/sqrt | 12% |
| other | 28% |
| Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput | Vectorization |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| STP X29, X30, [SP, #-112]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| CNTW X2, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| STP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ORR X25, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| SUB X0, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| STP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| STP X27, X28, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| LDP X1, X26, [X25] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDR X20, [X25, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (25.0%) |
| STR X1, [X29, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (25.0%) |
| LDP X24, X22, [X25, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| UBFM X1, X24, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X3, X24, #13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X1, X1, #23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X24, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| AND X1, X1, #0xfffffffffffffff0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CCMN X3, #15, #2, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| LDR W3, [X25, #88] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (12.5%) |
| SUB SP, SP, X1,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | N/A |
| ADD X23, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| B.HI 4023d4 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x574> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ADDVL X5, SP, #1 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| SUB X0, X24, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| PTRUE P7.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (100.0%) |
| MOVN X1, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X4, SP, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| DUP Z31.D, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | scal (3.1%) |
| ADD X5, X5, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| ADDPL X2, X6, #2 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| ADD X2, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| UBFM X0, X2, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X24, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| B.EQ 401f30 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0xd0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| SUB X1, X0, X1,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X1, X1, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X1, X23, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| UBFM X1, X22, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CNTW X2, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| ADD X1, X1, #23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X0, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| AND X1, X1, #0xfffffffffffffff0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X22, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| SUB X4, X22, #13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| SUB SP, SP, X1,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | N/A |
| CCMN X4, #15, #2, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X21, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| B.HI 4023f4 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x594> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ADDVL X5, SP, #1 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| SUB X0, X22, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| PTRUE P7.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (100.0%) |
| MOVN X1, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X4, SP, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| DUP Z30.D, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | scal (3.1%) |
| ADD X5, X5, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| ADDPL X2, X6, #2 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| ADD X2, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| UBFM X0, X2, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X22, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| B.EQ 401fd0 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x170> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| SUB X1, X0, X1,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X1, X1, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X1, X21, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| ADD X28, X20, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CNTD X1, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| UBFM X0, X28, #62, #61 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X1, X1, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X0, X0, #15 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X20, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| AND X0, X0, #0xfffffffffffffff0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X1, X20, #16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB SP, SP, X0,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | N/A |
| CCMN X1, #18, #2, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X27, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| B.HI 4023b0 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x550> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| CNTH X2, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| SUB X0, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X20, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| B.CC 402434 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x5d4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ADDVL X6, SP, #1 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| SUB X0, X20, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| PTRUE P7.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (100.0%) |
| MOVN X1, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X4, SP, #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| DUP Z29.B, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | scal (3.1%) |
| ADD X6, X6, #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADDPL X2, X5, #4 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| ADD X2, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X4, X27, X2,LSL #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| CMP X20, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| B.EQ 4020d0 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x270> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| CNTD X5, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| SUB X0, X20, X2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X1, X5, #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X8, X28, X2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X0, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| B.CC 4020b4 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x254> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ADD X0, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X7, X8, X5 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| PTRUE P7.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (100.0%) |
| ADD X0, X27, X0,LSL #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| MOVN X1, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| DUP Z28.B, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | scal (3.1%) |
| ADDPL X0, X6, #1 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| ADD X0, X0, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X4, X4, X0,LSL #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| ADD X2, X2, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X8, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| B.EQ 4020d0 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x270> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| SUB X0, X4, X2,LSL #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| STR W3, [X29, #104] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (12.5%) |
| BL 401930 <@plt_start@+0x2b0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ORR W19, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| BL 401880 <@plt_start@+0x200> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| LDR W3, [X29, #104] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (12.5%) |
| ORR W1, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| SDIV W5, W3, W19 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-12 | 5-12.50 | scal (12.5%) |
| MSUB W0, W5, W19, W3 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (12.5%) |
| CMP W1, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
| B.LT 4023a4 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x544> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| MOVZ X0, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| B 4020d0 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x270> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| MOVZ X0, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| B 401f30 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0xd0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| MOVZ X0, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| B 401fd0 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x170> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| MOVZ X2, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X4, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| B 402058 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x1f8> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
The code analyzed by CQA in that panel excludes loops and represents 0.00% of application time for the run run_1_thread.
| Source file and lines | main.cpp:138-143 |
| Module | kmeans-gcc-Ofast |
| nb instructions | 147 |
| nb uops | 131 |
| loop length | 588 |
| used w registers | 6 |
| used x registers | 22 |
| used b registers | 0 |
| used h registers | 0 |
| used s registers | 1 |
| used d registers | 0 |
| used q registers | 0 |
| used v registers | 0 |
| used z registers | 4 |
| nb stack references | 6 |
| micro-operation queue | 16.38 cycles |
| front end | 16.38 cycles |
| P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| uops | 8.00 | 8.00 | 25.25 | 25.25 | 25.25 | 25.25 | 2.00 | 2.00 | 0.00 | 0.00 | 4.33 | 4.33 | 4.33 | 4.00 | 4.00 |
| cycles | 8.00 | 8.00 | 25.25 | 25.25 | 25.25 | 25.25 | 2.00 | 2.00 | 0.00 | 0.00 | 4.33 | 4.33 | 4.33 | 4.00 | 4.00 |
| Cycles executing div or sqrt instructions | 5.00-12.50 |
| Front-end | 16.38 |
| Dispatch | 25.25 |
| DIV/SQRT | 5.00-12.50 |
| Overall L1 | 25.25 |
| all | 0% |
| load | 0% |
| store | 0% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | 0% |
| fma | 0% |
| div/sqrt | 0% |
| other | 0% |
| all | 28% |
| load | 30% |
| store | 42% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | 25% |
| fma | 12% |
| div/sqrt | 12% |
| other | 28% |
| Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput | Vectorization |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| STP X29, X30, [SP, #912]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| CNTW X2, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| STP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ORR X25, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| SUB X0, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| STP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| STP X27, X28, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| LDP X1, X26, [X25] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDR X20, [X25, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (25.0%) |
| STR X1, [X29, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (25.0%) |
| LDP X24, X22, [X25, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| UBFM X1, X24, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X3, X24, #13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X1, X1, #23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X24, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| AND X1, X1, #7932 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CCMN X3, #15, #2, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| LDR W3, [X25, #88] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (12.5%) |
| SUB SP, SP, X1,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | N/A |
| ADD X23, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| B.HI 4023d4 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x574> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ADDVL X5, SP, #1 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| SUB X0, X24, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| PTRUE P7.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (100.0%) |
| MOVN X1, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X4, SP, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| DUP Z31.D, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | scal (3.1%) |
| ADD X5, X5, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| ADDPL X2, X6, #2 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| ADD X2, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| UBFM X0, X2, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X24, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| B.EQ 401f30 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0xd0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| SUB X1, X0, X1,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X1, X1, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X1, X23, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| UBFM X1, X22, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CNTW X2, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| ADD X1, X1, #23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X0, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| AND X1, X1, #7932 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X22, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| SUB X4, X22, #13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| SUB SP, SP, X1,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | N/A |
| CCMN X4, #15, #2, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X21, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| B.HI 4023f4 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x594> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ADDVL X5, SP, #1 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| SUB X0, X22, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| PTRUE P7.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (100.0%) |
| MOVN X1, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X4, SP, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| DUP Z30.D, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | scal (3.1%) |
| ADD X5, X5, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| ADDPL X2, X6, #2 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| ADD X2, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| UBFM X0, X2, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X22, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| B.EQ 401fd0 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x170> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| SUB X1, X0, X1,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X1, X1, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X1, X21, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| ADD X28, X20, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CNTD X1, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| UBFM X0, X28, #62, #61 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X1, X1, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X0, X0, #15 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X20, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| AND X0, X0, #7932 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X1, X20, #16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB SP, SP, X0,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | N/A |
| CCMN X1, #18, #2, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X27, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| B.HI 4023b0 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x550> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| CNTH X2, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| SUB X0, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X20, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| B.CC 402434 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x5d4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ADDVL X6, SP, #1 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| SUB X0, X20, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| PTRUE P7.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (100.0%) |
| MOVN X1, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X4, SP, #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| DUP Z29.B, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | scal (3.1%) |
| ADD X6, X6, #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADDPL X2, X5, #4 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| ADD X2, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X4, X27, X2,LSL #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| CMP X20, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| B.EQ 4020d0 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x270> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| CNTD X5, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| SUB X0, X20, X2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X1, X5, #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X8, X28, X2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X0, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| B.CC 4020b4 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x254> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ADD X0, X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| SUB X7, X8, X5 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| PTRUE P7.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (100.0%) |
| ADD X0, X27, X0,LSL #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| MOVN X1, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| DUP Z28.B, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | scal (3.1%) |
| ADDPL X0, X6, #1 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (25.0%) |
| ADD X0, X0, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X4, X4, X0,LSL #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| ADD X2, X2, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| CMP X8, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (25.0%) |
| B.EQ 4020d0 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x270> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| SUB X0, X4, X2,LSL #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| STR W3, [X29, #104] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (12.5%) |
| BL 401930 <@plt_start@+0x2b0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ORR W19, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| BL 401880 <@plt_start@+0x200> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| LDR W3, [X29, #104] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (12.5%) |
| ORR W1, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| SDIV W5, W3, W19 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-12 | 5-12.50 | scal (12.5%) |
| MSUB W0, W5, W19, W3 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (12.5%) |
| CMP W1, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
| B.LT 4023a4 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x544> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| MOVZ X0, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| B 4020d0 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x270> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| MOVZ X0, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| B 401f30 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0xd0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| MOVZ X0, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| B 401fd0 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x170> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| MOVZ X2, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADD X4, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| B 402058 <_Z7k_meansiP7point_tS0_Piii._omp_fn.1+0x1f8> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| Run run_1_thread | Number processes: 1; Number nodes: 1; Run Command: <executable> kmeans/input/100000000.in 1000 100000000 50 25; MPI Command:; Dataset:; Run Directory: /home/fmusial/KMEANS_Benchmarks; OMP_PROC_BIND: close; OMP_NUM_THREADS: 1; OMP_PLACES: cores |
|---|---|
| Run run_2_threads | Number processes: 1; Number nodes: 1; Run Command: <executable> kmeans/input/100000000.in 1000 100000000 50 25; MPI Command:; Dataset:; Run Directory: /home/fmusial/KMEANS_Benchmarks; OMP_PLACES: cores; OMP_PROC_BIND: close; OMP_NUM_THREADS: 2 |
| Run run_4_threads | Number processes: 1; Number nodes: 1; Run Command: <executable> kmeans/input/100000000.in 1000 100000000 50 25; MPI Command:; Dataset:; Run Directory: /home/fmusial/KMEANS_Benchmarks; OMP_PLACES: cores; OMP_PROC_BIND: close; OMP_NUM_THREADS: 4 |
| Run run_8_threads | Number processes: 1; Number nodes: 1; Run Command: <executable> kmeans/input/100000000.in 1000 100000000 50 25; MPI Command:; Dataset:; Run Directory: /home/fmusial/KMEANS_Benchmarks; OMP_PLACES: cores; OMP_PROC_BIND: close; OMP_NUM_THREADS: 8 |
| Run run_16_threads | Number processes: 1; Number nodes: 1; Run Command: <executable> kmeans/input/100000000.in 1000 100000000 50 25; MPI Command:; Dataset:; Run Directory: /home/fmusial/KMEANS_Benchmarks; OMP_PLACES: cores; OMP_PROC_BIND: close; OMP_NUM_THREADS: 16 |
| Run run_32_threads | Number processes: 1; Number nodes: 1; Run Command: <executable> kmeans/input/100000000.in 1000 100000000 50 25; MPI Command:; Dataset:; Run Directory: /home/fmusial/KMEANS_Benchmarks; OMP_PROC_BIND: close; OMP_PLACES: cores; OMP_NUM_THREADS: 32 |
| Run run_64_threads | Number processes: 1; Number nodes: 1; Run Command: <executable> kmeans/input/100000000.in 1000 100000000 50 25; MPI Command:; Dataset:; Run Directory: /home/fmusial/KMEANS_Benchmarks; OMP_PROC_BIND: close; OMP_PLACES: cores; OMP_NUM_THREADS: 64 |
| (run_1_thread) Efficiency | (run_1_thread) Potential Speed-Up (%) | (run_2_threads) Efficiency | (run_2_threads) Potential Speed-Up (%) | (run_4_threads) Efficiency | (run_4_threads) Potential Speed-Up (%) | (run_8_threads) Efficiency | (run_8_threads) Potential Speed-Up (%) | (run_16_threads) Efficiency | (run_16_threads) Potential Speed-Up (%) | (run_32_threads) Efficiency | (run_32_threads) Potential Speed-Up (%) | (run_64_threads) Efficiency | (run_64_threads) Potential Speed-Up (%) |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 1 | 0 | 1.19 | 0 | 0.25 | 0.05 | 0.14 | 0.1 | 0.04 | 0.41 | 0.01 | 2.18 | 0 | 12.41 |
| Run | Number of threads | Efficiency (ideal is 1) | Speedup | Ideal Speedup | Time (s) | Coverage (%) |
|---|---|---|---|---|---|---|
| run_1_thread | 1 | 1 | 1 | 1 | 0.029999997466803 | 0.016349220648408 |
| run_2_threads | 1 | 1.19 | 2.39 | 2 | 0.024999994784594 | 0.013578470796347 |
| run_4_threads | 4 | 0.25 | 0.99 | 4 | 0.044999998062849 | 0.064996615052223 |
| run_8_threads | 8 | 0.14 | 1.1 | 8 | 0.054999999701977 | 0.11408393830061 |
| run_16_threads | 16 | 0.04 | 0.6 | 16 | 0.089999988675117 | 0.42092603445053 |
| run_32_threads | 32 | 0.01 | 0.21 | 32 | 0.2149999588728 | 2.1973106861115 |
| run_64_threads | 64 | 0 | 0.09 | 64 | 0.20499995350838 | 12.426350593567 |
| Name | Coverage (%) | Time (s) |
|---|---|---|
| ▼k_means(int, point_t*, point_t*, int*, int, int) [clone ._omp_fn.1]– | 0.02 | 0.03 |
| ○Loop 6 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 5 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 18 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 22 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ▼Loop 10 - main.cpp:138-143 - kmeans-gcc-Ofast– | 0.00 | 0.00 |
| ○Loop 15 - main.cpp:140-143 - kmeans-gcc-Ofast | 0.02 | 0.03 |
| ○Loop 8 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 11 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 14 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 9 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 12 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 7 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 13 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 16 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 21 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 19 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 20 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 4 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
| ○Loop 17 - main.cpp:138-138 - kmeans-gcc-Ofast | 0.00 | 0.00 |
