Function: qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::evaluate(qmcplusplus::ParticleSe ... | Module: exec | Source: SoaDistanceTableABOMPTarget.h:184-233 [...] | Coverage: 4.21% |
---|
Function: qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::evaluate(qmcplusplus::ParticleSe ... | Module: exec | Source: SoaDistanceTableABOMPTarget.h:184-233 [...] | Coverage: 4.21% |
---|
/usr/lib/gcc/aarch64-linux-gnu/12/../../../../include/c++/12/bits/stl_vector.h: 1124 - 1124 |
-------------------------------------------------------------------------------- |
1124: return *(this->_M_impl._M_start + __n); |
/home/hbollore/qaas-runs/171-284-6744/intel/miniqmc/build/miniqmc/src/Platforms/OMPTarget/OMPTargetMath.hpp: 38 - 38 |
-------------------------------------------------------------------------------- |
38: return a < b ? a : b; |
/home/hbollore/qaas-runs/171-284-6744/intel/miniqmc/build/miniqmc/src/Particle/Lattice/ParticleBConds3DSoa.h: 280 - 298 |
-------------------------------------------------------------------------------- |
280: T displ_0 = px[iat] - x0; |
281: T displ_1 = py[iat] - y0; |
282: T displ_2 = pz[iat] - z0; |
283: |
284: T ar_0 = displ_0 * g00 + displ_1 * g10 + displ_2 * g20; |
285: T ar_1 = displ_0 * g01 + displ_1 * g11 + displ_2 * g21; |
286: T ar_2 = displ_0 * g02 + displ_1 * g12 + displ_2 * g22; |
287: |
288: //put them in the box |
289: ar_0 -= round(ar_0); |
290: ar_1 -= round(ar_1); |
291: ar_2 -= round(ar_2); |
292: |
293: //unit2cart |
294: dx[iat] = ar_0 * r00 + ar_1 * r10 + ar_2 * r20; |
295: dy[iat] = ar_0 * r01 + ar_1 * r11 + ar_2 * r21; |
296: dz[iat] = ar_0 * r02 + ar_1 * r12 + ar_2 * r22; |
297: |
298: temp_r[iat] = std::sqrt(dx[iat] * dx[iat] + dy[iat] * dy[iat] + dz[iat] * dz[iat]); |
/home/hbollore/qaas-runs/171-284-6744/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/VectorSoAContainer.h: 267 - 267 |
-------------------------------------------------------------------------------- |
267: inline const T* data() const { return myData; } |
/usr/lib/gcc/aarch64-linux-gnu/12/../../../../include/c++/12/bits/unique_ptr.h: 191 - 191 |
-------------------------------------------------------------------------------- |
191: pointer _M_ptr() const noexcept { return std::get<0>(_M_t); } |
/home/hbollore/qaas-runs/171-284-6744/intel/miniqmc/build/miniqmc/src/Utilities/NewTimer.h: 242 - 249 |
-------------------------------------------------------------------------------- |
242: ScopeGuard(TIMER& t) : timer(t) { timer.start(); } |
[...] |
249: ~ScopeGuard() { timer.stop(); } |
/home/hbollore/qaas-runs/171-284-6744/intel/miniqmc/build/miniqmc/src/Particle/SoaDistanceTableABOMPTarget.h: 184 - 233 |
-------------------------------------------------------------------------------- |
184: { |
185: resize(); |
186: |
187: ScopedTimer local_timer(evaluate_timer_); |
188: // be aware of the sign of Displacement |
189: const int num_targets_local = num_targets_; |
190: const int num_sources_local = num_sources_; |
191: const int num_padded = getAlignedSize<T>(num_sources_); |
192: |
193: target_pos.resize(num_targets_ * D); |
194: for (size_t iat = 0; iat < num_targets_; iat++) |
195: for (size_t idim = 0; idim < D; idim++) |
196: target_pos[iat * D + idim] = P.R[iat][idim]; |
197: |
198: auto* target_pos_ptr = target_pos.data(); |
199: auto* source_pos_ptr = origin_.getCoordinates().getAllParticlePos().data(); |
[...] |
205: const size_t num_teams = (num_sources_ + ChunkSizePerTeam - 1) / ChunkSizePerTeam; |
206: const size_t stride_size = getPerTargetPctlStrideSize(); |
207: |
208: { |
209: ScopedTimer offload(offload_timer_); |
210: PRAGMA_OFFLOAD("omp target teams distribute collapse(2) num_teams(num_targets_*num_teams) \ |
211: map(to: source_pos_ptr[:num_padded*D]) \ |
212: map(always, to: target_pos_ptr[:num_targets_*D]) \ |
213: map(always, from: r_dr_ptr[:num_targets_*stride_size])") |
214: for (int iat = 0; iat < num_targets_local; ++iat) |
215: for (int team_id = 0; team_id < num_teams; team_id++) |
216: { |
217: const int first = ChunkSizePerTeam * team_id; |
[...] |
228: for (int iel = first; iel < last; iel++) |
229: DTD_BConds<T, D, SC>::computeDistancesOffload(pos, source_pos_ptr, num_padded, r_iat_ptr, dr_iat_ptr, |
230: num_padded, iel); |
231: } |
232: } |
233: } |
/home/hbollore/qaas-runs/171-284-6744/intel/miniqmc/build/miniqmc/src/Numerics/OhmmsPETE/OhmmsVector.h: 223 - 248 |
-------------------------------------------------------------------------------- |
223: return X[i]; |
[...] |
248: inline pointer data() { return X; } |
0x4a27e0 STP D15, D14, [SP, #864]! |
0x4a27e4 STP D13, D12, [SP, #16] |
0x4a27e8 STP D11, D10, [SP, #32] |
0x4a27ec STP D9, D8, [SP, #48] |
0x4a27f0 STP X29, X30, [SP, #64] |
0x4a27f4 STP X28, X27, [SP, #80] |
0x4a27f8 STP X26, X25, [SP, #96] |
0x4a27fc STP X24, X23, [SP, #112] |
0x4a2800 STP X22, X21, [SP, #128] |
0x4a2804 STP X20, X19, [SP, #144] |
0x4a2808 ADD X29, SP, #64 |
0x4a280c ADDVL SP, SP, #46 |
0x4a2810 SUB SP, SP, #288 |
0x4a2814 ORR X21, XZR, X1 |
0x4a2818 ORR X24, XZR, X0 |
0x4a281c BL 4a4500 |
0x4a2820 LDR X20, [X24, #440] |
0x4a2824 ORR X0, XZR, X20 |
0x4a2828 BL 46c620 |
0x4a282c LDP X23, X27, [X24, #16] |
0x4a2830 ADD X0, X24, #384 |
0x4a2834 ADD X1, X27, X27,LSL #1 |
0x4a2838 MOVI D0, #0 |
0x4a283c BL 43e8c0 |
0x4a2840 LDR X9, [X24, #24] |
0x4a2844 CBZ X9, 4a28b0 |
0x4a2848 CNTW X10, ALL |
0x4a284c LDR X8, [X21, #64] |
0x4a2850 LDR X3, [X24, #408] |
0x4a2854 MOVZ W11, #32 |
0x4a2858 CMP X10, #32 |
0x4a285c CSEL X11, X10, X11, #8 |
0x4a2860 CMP X9, X11 |
0x4a2864 ORR X11, XZR, XZR |
0x4a2868 STR X3, [SP, #208] |
0x4a286c B.CS 4a2fc8 |
(2731) 0x4a2870 ADD X10, X11, X11,LSL #1 |
(2731) 0x4a2874 SUB X9, X9, X11 |
(2731) 0x4a2878 UBFM X10, X10, #61, #60 |
(2731) 0x4a287c HINT #0 |
(2730) 0x4a2880 ADD X11, X8, X10 |
(2730) 0x4a2884 ADD X12, X3, X10 |
(2730) 0x4a2888 SUBS X9, X9, #1 |
(2730) 0x4a288c ADD X10, X10, #24 |
(2730) 0x4a2890 LDR D0, [X11] |
(2730) 0x4a2894 STR D0, [X12] |
(2730) 0x4a2898 LDR D0, [X11, #8] |
(2730) 0x4a289c STR D0, [X12, #8] |
(2730) 0x4a28a0 LDR D0, [X11, #16] |
(2730) 0x4a28a4 STR D0, [X12, #16] |
(2730) 0x4a28a8 B.NE 4a2880 |
(2731) 0x4a28ac B 4a28b8 |
0x4a28b0 LDR X8, [X24, #408] |
0x4a28b4 STR X8, [SP, #208] |
(2731) 0x4a28b8 LDR X8, [X24, #8] |
(2731) 0x4a28bc LDR X0, [X8, #632] |
(2731) 0x4a28c0 LDR X8, [X0] |
(2731) 0x4a28c4 LDR X8, [X8, #72] |
(2731) 0x4a28c8 BLR X8 |
(2731) 0x4a28cc LDR X8, [X24, #72] |
(2731) 0x4a28d0 LDR X21, [X0, #24] |
(2731) 0x4a28d4 LDR X19, [X24, #16] |
(2731) 0x4a28d8 LDR X8, [X8, #24] |
(2731) 0x4a28dc STR X8, [SP, #104] |
(2731) 0x4a28e0 LDR X8, [X24] |
(2731) 0x4a28e4 LDR X8, [X8, #136] |
(2731) 0x4a28e8 ORR X0, XZR, X24 |
(2731) 0x4a28ec BLR X8 |
(2731) 0x4a28f0 LDR X25, [X24, #432] |
(2731) 0x4a28f4 ORR X22, XZR, X0 |
(2731) 0x4a28f8 ORR X0, XZR, X25 |
(2731) 0x4a28fc BL 46c620 |
(2731) 0x4a2900 LDR X5, [SP, #208] |
(2731) 0x4a2904 CMP W27, #1 |
(2731) 0x4a2908 B.LT 4a3060 |
(2731) 0x4a290c ADD X8, X19, #511 |
(2731) 0x4a2910 CMP X8, #512 |
(2731) 0x4a2914 B.CC 4a3060 |
(2732) 0x4a2918 ADD X9, X23, #3 |
(2732) 0x4a291c AND X11, X27, #6080 |
(2732) 0x4a2920 UBFM X8, X8, #9, #63 |
(2732) 0x4a2924 LDR X7, [SP, #104] |
(2732) 0x4a2928 UBFM X17, X22, #61, #60 |
(2732) 0x4a292c STP X25, X20, [SP, #16] |
(2732) 0x4a2930 STP X11, X24, [SP, #88] |
(2732) 0x4a2934 ORR X12, XZR, XZR |
(2732) 0x4a2938 AND X9, X9, #8062 |
(2732) 0x4a293c CMP X8, #1 |
(2732) 0x4a2940 PTRUE P0.D, ALL |
(2732) 0x4a2944 STR X23, [SP, #200] |
(2732) 0x4a2948 UBFM W10, W9, #31, #30 |
(2732) 0x4a294c UBFM X14, X9, #32, #31 |
(2732) 0x4a2950 SBFM X15, X9, #0, #31 |
(2732) 0x4a2954 ADD X11, X21, W9,SXTW #3 |
(2732) 0x4a2958 CSINC X0, X8, XZR, #8 |
(2732) 0x4a295c SBFM X16, X10, #0, #31 |
(2732) 0x4a2960 ADD X13, X21, W10,SXTW #3 |
(2732) 0x4a2964 SBFM X10, X14, #29, #63 |
(2732) 0x4a2968 STP X10, X17, [SP, #72] |
(2732) 0x4a296c SBFM X9, X14, #28, #63 |
(2732) 0x4a2970 ORR X14, X10, #4157 |
(2732) 0x4a2974 UBFM X8, X15, #61, #60 |
(2732) 0x4a2978 ADD X3, X7, X8 |
(2732) 0x4a297c STP X14, X9, [SP, #56] |
(2732) 0x4a2980 ORR X9, X9, #4157 |
(2732) 0x4a2984 ADD X2, X7, X15,LSL #4 |
(2732) 0x4a2988 STR X9, [SP, #48] |
(2732) 0x4a298c UBFM X9, X16, #61, #60 |
(2732) 0x4a2990 ADD X10, X9, X10 |
(2732) 0x4a2994 ADD X9, X9, X8 |
(2732) 0x4a2998 RDVL X8, #1 |
(2732) 0x4a299c ADD X20, X7, X9 |
(2732) 0x4a29a0 STR X10, [SP, #40] |
(2732) 0x4a29a4 ORR X10, X10, #4157 |
(2732) 0x4a29a8 UBFM X8, X8, #4, #63 |
(2732) 0x4a29ac STR X10, [SP, #32] |
(2732) 0x4a29b0 STR X8, [SP, #120] |
(2732) 0x4a29b4 B 4a29e8 |
0x4a29b8 HINT #0 |
0x4a29bc HINT #0 |
(2732) 0x4a29c0 LDR X12, [SP, #112] |
(2732) 0x4a29c4 LDP X17, X8, [SP, #80] |
(2732) 0x4a29c8 LDR X24, [SP, #96] |
(2732) 0x4a29cc ADD X12, X12, #1 |
(2732) 0x4a29d0 ADD X7, X7, X17 |
(2732) 0x4a29d4 ADD X20, X20, X17 |
(2732) 0x4a29d8 ADD X2, X2, X17 |
(2732) 0x4a29dc ADD X3, X3, X17 |
(2732) 0x4a29e0 CMP X12, X8 |
(2732) 0x4a29e4 B.EQ 4a305c |
(2732) 0x4a29e8 MADD X8, X17, X12, XZR |
(2732) 0x4a29ec STR X12, [SP, #112] |
(2732) 0x4a29f0 ADD W17, W12, W12,LSL #1 |
(2732) 0x4a29f4 LDR X12, [SP, #56] |
(2732) 0x4a29f8 LDP D0, D1, [X24, #280] |
(2732) 0x4a29fc ORR X22, XZR, XZR |
(2732) 0x4a2a00 MOVZ W19, #512 |
(2732) 0x4a2a04 LDP D2, D3, [X24, #296] |
(2732) 0x4a2a08 LDP D4, D5, [X24, #312] |
(2732) 0x4a2a0c ORR X27, XZR, XZR |
(2732) 0x4a2a10 ORR X14, XZR, XZR |
(2732) 0x4a2a14 LDP D6, D7, [X24, #328] |
(2732) 0x4a2a18 LDP D17, D18, [X24, #200] |
(2732) 0x4a2a1c LDP D19, D20, [X24, #216] |
(2732) 0x4a2a20 ORR X25, XZR, X21 |
(2732) 0x4a2a24 ORR X9, XZR, X11 |
(2732) 0x4a2a28 LDP D21, D16, [X24, #232] |
(2732) 0x4a2a2c LDP D22, D23, [X24, #248] |
(2732) 0x4a2a30 ORR X16, XZR, X13 |
(2732) 0x4a2a34 DUP Z27.D, Z20.D[0] |
(2732) 0x4a2a38 ADD X15, X12, X8 |
(2732) 0x4a2a3c LDP X12, X10, [SP, #64] |
(2732) 0x4a2a40 ADD X10, X10, X8 |
(2732) 0x4a2a44 LDP D25, D24, [X24, #264] |
(2732) 0x4a2a48 DUP Z13.D, Z16.D[0] |
(2732) 0x4a2a4c DUP Z10.D, Z23.D[0] |
(2732) 0x4a2a50 DUP Z15.D, Z24.D[0] |
(2732) 0x4a2a54 DUP Z28.D, Z7.D[0] |
(2732) 0x4a2a58 DUP Z14.D, Z18.D[0] |
(2732) 0x4a2a5c DUP Z26.D, Z0.D[0] |
(2732) 0x4a2a60 DUP Z12.D, Z19.D[0] |
(2732) 0x4a2a64 DUP Z9.D, Z22.D[0] |
(2732) 0x4a2a68 DUP Z11.D, Z25.D[0] |
(2732) 0x4a2a6c DUP Z29.D, Z17.D[0] |
(2732) 0x4a2a70 ORR X6, XZR, X3 |
(2732) 0x4a2a74 CNTD X24, ALL |
(2732) 0x4a2a78 ADD X18, X12, X8 |
(2732) 0x4a2a7c LDR X12, [SP, #48] |
(2732) 0x4a2a80 ADD X1, X12, X8 |
(2732) 0x4a2a84 LDR X12, [SP, #40] |
(2732) 0x4a2a88 ADD X4, X12, X8 |
(2732) 0x4a2a8c LDR X12, [SP, #32] |
(2732) 0x4a2a90 ADD X8, X12, X8 |
(2732) 0x4a2a94 ADD W12, W17, #1 |
(2732) 0x4a2a98 STP X12, X17, [SP, #272] |
(2732) 0x4a2a9c ADD W12, W17, #2 |
(2732) 0x4a2aa0 STR X12, [SP, #264] |
(2732) 0x4a2aa4 LDR X12, [SP, #104] |
(2732) 0x4a2aa8 ADD X10, X12, X10 |
(2732) 0x4a2aac ADD X8, X12, X8 |
(2732) 0x4a2ab0 STR X10, [SP, #256] |
(2732) 0x4a2ab4 ADD X10, X12, X15 |
(2732) 0x4a2ab8 ORR X15, XZR, X7 |
(2732) 0x4a2abc STR X10, [SP, #248] |
(2732) 0x4a2ac0 ADD X10, X12, X18 |
(2732) 0x4a2ac4 STR X10, [SP, #240] |
(2732) 0x4a2ac8 ADD X10, X12, X1 |
(2732) 0x4a2acc ORR X1, XZR, X20 |
(2732) 0x4a2ad0 STR X10, [SP, #232] |
(2732) 0x4a2ad4 ADD X10, X12, X4 |
(2732) 0x4a2ad8 STP X8, X10, [SP, #216] |
(2732) 0x4a2adc SUB X8, X29, #64 |
(2732) 0x4a2ae0 SUB X10, X29, #64 |
(2732) 0x4a2ae4 STR Z26, [X8, #498, MUL VL] |
(2732) 0x4a2ae8 DUP Z26.D, Z1.D[0] |
(2732) 0x4a2aec SUB X8, X29, #64 |
(2732) 0x4a2af0 STR Z26, [X8, #497, MUL VL] |
(2732) 0x4a2af4 DUP Z26.D, Z2.D[0] |
(2732) 0x4a2af8 SUB X8, X29, #64 |
(2732) 0x4a2afc STR Z26, [X8, #496, MUL VL] |
(2732) 0x4a2b00 DUP Z26.D, Z3.D[0] |
(2732) 0x4a2b04 SUB X8, X29, #64 |
(2732) 0x4a2b08 STR Z26, [X8, #495, MUL VL] |
(2732) 0x4a2b0c DUP Z26.D, Z4.D[0] |
(2732) 0x4a2b10 SUB X8, X29, #64 |
(2732) 0x4a2b14 STR Z26, [X8, #494, MUL VL] |
(2732) 0x4a2b18 DUP Z26.D, Z5.D[0] |
(2732) 0x4a2b1c SUB X8, X29, #64 |
(2732) 0x4a2b20 STR Z26, [X8, #504, MUL VL] |
(2732) 0x4a2b24 DUP Z26.D, Z6.D[0] |
(2732) 0x4a2b28 SUB X8, X29, #64 |
(2732) 0x4a2b2c STR Z26, [X8, #503, MUL VL] |
(2732) 0x4a2b30 DUP Z26.D, Z21.D[0] |
(2732) 0x4a2b34 ORR X8, XZR, X2 |
(2732) 0x4a2b38 STP D1, D0, [SP, #184] |
(2732) 0x4a2b3c STP D3, D2, [SP, #168] |
(2732) 0x4a2b40 STP D5, D4, [SP, #152] |
(2732) 0x4a2b44 STP D7, D6, [SP, #136] |
(2732) 0x4a2b48 STR Z12, [X10, #511, MUL VL] |
(2732) 0x4a2b4c SUB X10, X29, #64 |
(2732) 0x4a2b50 STR Z27, [X10, #510, MUL VL] |
(2732) 0x4a2b54 SUB X10, X29, #64 |
(2732) 0x4a2b58 STR Z26, [X10, #509, MUL VL] |
(2732) 0x4a2b5c SUB X10, X29, #64 |
(2732) 0x4a2b60 STR Z13, [X10, #502, MUL VL] |
(2732) 0x4a2b64 SUB X10, X29, #64 |
(2732) 0x4a2b68 STR Z9, [X10, #501, MUL VL] |
(2732) 0x4a2b6c SUB X10, X29, #64 |
(2732) 0x4a2b70 STR Z10, [X10, #500, MUL VL] |
(2732) 0x4a2b74 SUB X10, X29, #64 |
(2732) 0x4a2b78 STR Z11, [X10, #499, MUL VL] |
(2732) 0x4a2b7c SUB X10, X29, #64 |
(2732) 0x4a2b80 STR D22, [SP, #128] |
(2732) 0x4a2b84 STR Z14, [X10, #508, MUL VL] |
(2732) 0x4a2b88 B 4a2bc0 |
(2733) 0x4a2b8c ADD X27, X27, #1 |
(2733) 0x4a2b90 ADD X14, X14, #512 |
(2733) 0x4a2b94 ADD X15, X15, #1 |
(2733) 0x4a2b98 ADD X1, X1, #1 |
(2733) 0x4a2b9c ADD X8, X8, #1 |
(2733) 0x4a2ba0 ADD X6, X6, #1 |
(2733) 0x4a2ba4 ADD X16, X16, #1 |
(2733) 0x4a2ba8 ADD X9, X9, #1 |
(2733) 0x4a2bac ADD X25, X25, #1 |
(2733) 0x4a2bb0 SUB X22, X22, #512 |
(2733) 0x4a2bb4 ADD W19, W19, #512 |
(2733) 0x4a2bb8 CMP X27, X0 |
(2733) 0x4a2bbc B.EQ 4a29c0 |
(2733) 0x4a2bc0 CMP W19, W23 |
(2733) 0x4a2bc4 ADD W18, W14, #512 |
(2733) 0x4a2bc8 UBFM X4, X27, #55, #54 |
(2733) 0x4a2bcc CSEL W10, W19, W23, #11 |
(2733) 0x4a2bd0 CMP W18, W23 |
(2733) 0x4a2bd4 CSEL W26, W18, W23, #11 |
(2733) 0x4a2bd8 ADD W18, W4, #512 |
(2733) 0x4a2bdc CMP W18, W23 |
(2733) 0x4a2be0 CSEL W18, W18, W23, #11 |
(2733) 0x4a2be4 SBFM X18, X18, #0, #31 |
(2733) 0x4a2be8 CMP X4, X18 |
(2733) 0x4a2bec B.GE 4a2b8c |
(2733) 0x4a2bf0 LDR X12, [SP, #280] |
(2733) 0x4a2bf4 SBFM X30, X26, #0, #31 |
(2733) 0x4a2bf8 CMP X24, #4 |
(2733) 0x4a2bfc SUB X26, X30, X4 |
(2733) 0x4a2c00 LDR D30, [X5, X12,LSL #3] |
(2733) 0x4a2c04 LDR X12, [SP, #272] |
(2733) 0x4a2c08 LDR D31, [X5, X12,LSL #3] |
(2733) 0x4a2c0c LDR X12, [SP, #264] |
(2733) 0x4a2c10 LDR D8, [X5, X12,LSL #3] |
(2733) 0x4a2c14 MOVZ W12, #4 |
(2733) 0x4a2c18 CSEL X28, X24, X12, #8 |
(2733) 0x4a2c1c CMP X26, X28 |
(2733) 0x4a2c20 ORR X28, XZR, X14 |
(2733) 0x4a2c24 B.CC 4a2ea0 |
(2733) 0x4a2c28 LDR X12, [SP, #256] |
(2733) 0x4a2c2c UBFM X28, X27, #52, #51 |
(2733) 0x4a2c30 ORR X23, XZR, X0 |
(2733) 0x4a2c34 ORN X4, XZR, X4 |
(2733) 0x4a2c38 ADD X4, X4, X30 |
(2733) 0x4a2c3c ADD X17, X12, X28 |
(2733) 0x4a2c40 LDR X12, [SP, #248] |
(2733) 0x4a2c44 UBFM X4, X4, #61, #60 |
(2733) 0x4a2c48 ADD X0, X12, X28 |
(2733) 0x4a2c4c LDR X12, [SP, #240] |
(2733) 0x4a2c50 ADD X0, X0, X4 |
(2733) 0x4a2c54 ADD X24, X12, X28 |
(2733) 0x4a2c58 LDP X5, X12, [SP, #224] |
(2733) 0x4a2c5c ADD X30, X12, X28 |
(2733) 0x4a2c60 ADD X5, X5, X28 |
(2733) 0x4a2c64 ADD X12, X30, X4 |
(2733) 0x4a2c68 LDR X30, [SP, #216] |
(2733) 0x4a2c6c ADD X28, X30, X28 |
(2733) 0x4a2c70 ADD X4, X28, X4 |
(2733) 0x4a2c74 ORR X28, XZR, X14 |
(2733) 0x4a2c78 CMP X17, X4 |
(2733) 0x4a2c7c CCMP X5, X0, #2, #3 |
(2733) 0x4a2c80 CSINC W30, WZR, WZR, #2 |
(2733) 0x4a2c84 CMP X24, X4 |
(2733) 0x4a2c88 CCMP X5, X12, #2, #3 |
(2733) 0x4a2c8c CSINC W4, WZR, WZR, #2 |
(2733) 0x4a2c90 CMP X24, X0 |
(2733) 0x4a2c94 ORR X0, XZR, X23 |
(2733) 0x4a2c98 CNTD X24, ALL |
(2733) 0x4a2c9c LDP X23, X5, [SP, #200] |
(2733) 0x4a2ca0 CCMP X17, X12, #2, #3 |
(2733) 0x4a2ca4 B.CC 4a2ea0 |
(2733) 0x4a2ca8 ORR X28, XZR, X14 |
(2733) 0x4a2cac TBNZ W30, #0, 4a2ea0 |
(2733) 0x4a2cb0 ORR X28, XZR, X14 |
(2733) 0x4a2cb4 TBNZ W4, #0, 4a2ea0 |
(2733) 0x4a2cb8 ADD X12, X22, W10,SXTW |
(2733) 0x4a2cbc UDIV X10, X26, X24 |
(2733) 0x4a2cc0 DUP Z0.D, Z30.D[0] |
(2733) 0x4a2cc4 ORR Z6.D, Z29.D, Z29.D |
(2733) 0x4a2cc8 ORR Z5.D, Z28.D, Z28.D |
(2733) 0x4a2ccc ORR X4, XZR, XZR |
(2733) 0x4a2cd0 ORR Z22.D, Z11.D, Z11.D |
(2733) 0x4a2cd4 ORR Z11.D, Z10.D, Z10.D |
(2733) 0x4a2cd8 ORR Z10.D, Z9.D, Z9.D |
(2733) 0x4a2cdc ORR Z9.D, Z13.D, Z13.D |
(2733) 0x4a2ce0 MADD X17, X10, X24, XZR |
(2733) 0x4a2ce4 UDIV X12, X12, X24 |
(2733) 0x4a2ce8 SUB X10, X26, X17 |
(2733) 0x4a2cec ADD X28, X14, X17 |
(2733) 0x4a2cf0 SUB X17, X29, #64 |
(2733) 0x4a2cf4 STR Z0, [X17, #507, MUL VL] |
(2733) 0x4a2cf8 DUP Z0.D, Z31.D[0] |
(2733) 0x4a2cfc SUB X17, X29, #64 |
(2733) 0x4a2d00 STR Z0, [X17, #506, MUL VL] |
(2733) 0x4a2d04 DUP Z0.D, Z8.D[0] |
(2733) 0x4a2d08 SUB X17, X29, #64 |
(2733) 0x4a2d0c STR Z0, [X17, #505, MUL VL] |
(2733) 0x4a2d10 LDR X17, [SP, #120] |
(2733) 0x4a2d14 MADD X12, X17, X12, XZR |
(2733) 0x4a2d18 UBFM X26, X12, #63, #62 |
(2733) 0x4a2d1c SUB X12, X29, #64 |
(2733) 0x4a2d20 LDR Z0, [X12, #496, MUL VL] |
(2733) 0x4a2d24 SUB X12, X29, #64 |
(2733) 0x4a2d28 LDR Z29, [X12, #497, MUL VL] |
(2733) 0x4a2d2c SUB X12, X29, #64 |
(2733) 0x4a2d30 LDR Z28, [X12, #498, MUL VL] |
(2733) 0x4a2d34 SUB X12, X29, #64 |
(2733) 0x4a2d38 LDR Z1, [X12, #495, MUL VL] |
(2733) 0x4a2d3c SUB X12, X29, #64 |
(2733) 0x4a2d40 LDR Z2, [X12, #494, MUL VL] |
(2733) 0x4a2d44 SUB X12, X29, #64 |
(2733) 0x4a2d48 LDR Z3, [X12, #504, MUL VL] |
(2733) 0x4a2d4c SUB X12, X29, #64 |
(2733) 0x4a2d50 LDR Z4, [X12, #503, MUL VL] |
(2733) 0x4a2d54 HINT #0 |
(2733) 0x4a2d58 HINT #0 |
(2733) 0x4a2d5c HINT #0 |
(2735) 0x4a2d60 SUB X12, X29, #64 |
(2735) 0x4a2d64 LD1D {Z12.D}, P0/Z, [X25, X4,LSL #3] |
(2735) 0x4a2d68 ORR Z27.D, Z15.D, Z15.D |
(2735) 0x4a2d6c LDR Z7, [X12, #507, MUL VL] |
(2735) 0x4a2d70 SUB X12, X29, #64 |
(2735) 0x4a2d74 LD1D {Z13.D}, P0/Z, [X9, X4,LSL #3] |
(2735) 0x4a2d78 FSUB Z12.D, Z12.D, Z7.D |
(2735) 0x4a2d7c LDR Z7, [X12, #506, MUL VL] |
(2735) 0x4a2d80 SUB X12, X29, #64 |
(2735) 0x4a2d84 LD1D {Z14.D}, P0/Z, [X16, X4,LSL #3] |
(2735) 0x4a2d88 FMUL Z15.D, Z15.D, Z12.D |
(2735) 0x4a2d8c FMUL Z26.D, Z0.D, Z12.D |
(2735) 0x4a2d90 FMUL Z12.D, Z3.D, Z12.D |
(2735) 0x4a2d94 FSUB Z13.D, Z13.D, Z7.D |
(2735) 0x4a2d98 LDR Z7, [X12, #505, MUL VL] |
(2735) 0x4a2d9c SUB X12, X29, #64 |
(2735) 0x4a2da0 FMLA Z15.D, P0/M, Z28.D, Z13.D |
(2735) 0x4a2da4 FMLA Z26.D, P0/M, Z1.D, Z13.D |
(2735) 0x4a2da8 FMLA Z12.D, P0/M, Z4.D, Z13.D |
(2735) 0x4a2dac FSUB Z14.D, Z14.D, Z7.D |
(2735) 0x4a2db0 LDR Z7, [X12, #508, MUL VL] |
(2735) 0x4a2db4 SUB X12, X29, #64 |
(2735) 0x4a2db8 FMLA Z15.D, P0/M, Z29.D, Z14.D |
(2735) 0x4a2dbc FMLA Z26.D, P0/M, Z2.D, Z14.D |
(2735) 0x4a2dc0 FMLA Z12.D, P0/M, Z5.D, Z14.D |
(2735) 0x4a2dc4 MOVPRFX Z13, Z15 |
(2735) 0x4a2dc8 FRINTA Z13.D, P0/M, Z15.D |
(2735) 0x4a2dcc MOVPRFX Z14, Z26 |
(2735) 0x4a2dd0 FRINTA Z14.D, P0/M, Z26.D |
(2735) 0x4a2dd4 FSUB Z13.D, Z15.D, Z13.D |
(2735) 0x4a2dd8 FSUB Z26.D, Z26.D, Z14.D |
(2735) 0x4a2ddc MOVPRFX Z14, Z12 |
(2735) 0x4a2de0 FRINTA Z14.D, P0/M, Z12.D |
(2735) 0x4a2de4 FSUB Z12.D, Z12.D, Z14.D |
(2735) 0x4a2de8 FMUL Z14.D, Z6.D, Z13.D |
(2735) 0x4a2dec FMLA Z14.D, P0/M, Z7.D, Z26.D |
(2735) 0x4a2df0 LDR Z7, [X12, #511, MUL VL] |
(2735) 0x4a2df4 SUB X12, X29, #64 |
(2735) 0x4a2df8 FMLA Z14.D, P0/M, Z12.D, Z7.D |
(2735) 0x4a2dfc ST1D {Z14.D}, P0, [X6, X4,LSL #3] |
(2735) 0x4a2e00 LDR Z15, [X12, #510, MUL VL] |
(2735) 0x4a2e04 SUB X12, X29, #64 |
(2735) 0x4a2e08 LDR Z7, [X12, #509, MUL VL] |
(2735) 0x4a2e0c FMUL Z15.D, Z15.D, Z13.D |
(2735) 0x4a2e10 FMUL Z13.D, Z10.D, Z13.D |
(2735) 0x4a2e14 FMLA Z15.D, P0/M, Z7.D, Z26.D |
(2735) 0x4a2e18 FMAD Z26.D, P0/M, Z11.D, Z13.D |
(2735) 0x4a2e1c FMLA Z26.D, P0/M, Z22.D, Z12.D |
(2735) 0x4a2e20 FMLA Z15.D, P0/M, Z9.D, Z12.D |
(2735) 0x4a2e24 FMUL Z12.D, Z14.D, Z14.D |
(2735) 0x4a2e28 ST1D {Z26.D}, P0, [X1, X4,LSL #3] |
(2735) 0x4a2e2c FMAD Z26.D, P0/M, Z26.D, Z12.D |
(2735) 0x4a2e30 ST1D {Z15.D}, P0, [X8, X4,LSL #3] |
(2735) 0x4a2e34 FMLA Z26.D, P0/M, Z15.D, Z15.D |
(2735) 0x4a2e38 ORR Z15.D, Z27.D, Z27.D |
(2735) 0x4a2e3c FSQRT Z26.D, P0/M, Z26.D |
(2735) 0x4a2e40 ST1D {Z26.D}, P0, [X15, X4,LSL #3] |
(2735) 0x4a2e44 ADD X4, X4, X24 |
(2735) 0x4a2e48 CMP X26, X4 |
(2735) 0x4a2e4c B.NE 4a2d60 |
(2733) 0x4a2e50 SUB X12, X29, #64 |
(2733) 0x4a2e54 LDP D1, D0, [SP, #184] |
(2733) 0x4a2e58 LDP D3, D2, [SP, #168] |
(2733) 0x4a2e5c ORR Z28.D, Z5.D, Z5.D |
(2733) 0x4a2e60 LDP D5, D4, [SP, #152] |
(2733) 0x4a2e64 ORR Z29.D, Z6.D, Z6.D |
(2733) 0x4a2e68 ORR Z13.D, Z9.D, Z9.D |
(2733) 0x4a2e6c LDP D7, D6, [SP, #136] |
(2733) 0x4a2e70 LDR Z14, [X12, #508, MUL VL] |
(2733) 0x4a2e74 SUB X12, X29, #64 |
(2733) 0x4a2e78 ORR Z9.D, Z10.D, Z10.D |
(2733) 0x4a2e7c LDR Z12, [X12, #511, MUL VL] |
(2733) 0x4a2e80 SUB X12, X29, #64 |
(2733) 0x4a2e84 ORR Z10.D, Z11.D, Z11.D |
(2733) 0x4a2e88 ORR Z11.D, Z22.D, Z22.D |
(2733) 0x4a2e8c LDR Z27, [X12, #510, MUL VL] |
(2733) 0x4a2e90 SUB X12, X29, #64 |
(2733) 0x4a2e94 LDR Z26, [X12, #509, MUL VL] |
(2733) 0x4a2e98 LDR D22, [SP, #128] |
(2733) 0x4a2e9c CBZ X10, 4a2b8c |
(2733) 0x4a2ea0 SUB X10, X29, #64 |
(2733) 0x4a2ea4 ORR Z13.D, Z29.D, Z29.D |
(2733) 0x4a2ea8 ORR Z29.D, Z28.D, Z28.D |
(2733) 0x4a2eac LDR Z26, [X10, #503, MUL VL] |
(2733) 0x4a2eb0 SUB X10, X29, #64 |
(2733) 0x4a2eb4 LDR Z26, [X10, #504, MUL VL] |
(2733) 0x4a2eb8 HINT #0 |
(2733) 0x4a2ebc HINT #0 |
(2734) 0x4a2ec0 LDR D26, [X21, X28,LSL #3] |
(2734) 0x4a2ec4 LDR D9, [X11, X28,LSL #3] |
(2734) 0x4a2ec8 LDR D10, [X13, X28,LSL #3] |
(2734) 0x4a2ecc FSUB D26, D26, S30 |
(2734) 0x4a2ed0 FSUB D9, D9, S31 |
(2734) 0x4a2ed4 FSUB D10, D10, S8 |
(2734) 0x4a2ed8 FMUL D11, D24, D26 |
(2734) 0x4a2edc FMUL D12, D2, D26 |
(2734) 0x4a2ee0 FMUL D26, D5, D26 |
(2734) 0x4a2ee4 FMADD D11, D0, D9, D11 |
(2734) 0x4a2ee8 FMADD D26, D6, D9, D26 |
(2734) 0x4a2eec FMADD D12, D3, D9, D12 |
(2734) 0x4a2ef0 FMADD D11, D1, D10, D11 |
(2734) 0x4a2ef4 FMADD D26, D7, D10, D26 |
(2734) 0x4a2ef8 FMADD D12, D4, D10, D12 |
(2734) 0x4a2efc FRINTA D9, D11 |
(2734) 0x4a2f00 FRINTA D10, D12 |
(2734) 0x4a2f04 FSUB D9, D11, S9 |
(2734) 0x4a2f08 FRINTA D11, D26 |
(2734) 0x4a2f0c FSUB D10, D12, S10 |
(2734) 0x4a2f10 FMOV D12, D17 |
(2734) 0x4a2f14 FMOV D12, D18 |
(2734) 0x4a2f18 FMOV D12, D19 |
(2734) 0x4a2f1c FMOV D12, D20 |
(2734) 0x4a2f20 FMOV D12, D21 |
(2734) 0x4a2f24 FMOV D12, D16 |
(2734) 0x4a2f28 FSUB D26, D26, S11 |
(2734) 0x4a2f2c FMUL D11, D17, D9 |
(2734) 0x4a2f30 FMADD D11, D18, D10, D11 |
(2734) 0x4a2f34 FMADD D11, D26, D19, D11 |
(2734) 0x4a2f38 STR D11, [X3, X28,LSL #3] |
(2734) 0x4a2f3c FMUL D11, D20, D9 |
(2734) 0x4a2f40 FMUL D9, D22, D9 |
(2734) 0x4a2f44 FMADD D11, D21, D10, D11 |
(2734) 0x4a2f48 FMADD D9, D23, D10, D9 |
(2734) 0x4a2f4c FMADD D11, D16, D26, D11 |
(2734) 0x4a2f50 FMADD D26, D25, D26, D9 |
(2734) 0x4a2f54 STR D11, [X2, X28,LSL #3] |
(2734) 0x4a2f58 STR D26, [X20, X28,LSL #3] |
(2734) 0x4a2f5c FMUL D26, D26, D26 |
(2734) 0x4a2f60 LDR D9, [X3, X28,LSL #3] |
(2734) 0x4a2f64 LDR D10, [X2, X28,LSL #3] |
(2734) 0x4a2f68 FMADD D26, D9, D9, D26 |
(2734) 0x4a2f6c FMADD D26, D10, D10, D26 |
(2734) 0x4a2f70 FSQRT D26, D26 |
(2734) 0x4a2f74 STR D26, [X7, X28,LSL #3] |
(2734) 0x4a2f78 ADD X28, X28, #1 |
(2734) 0x4a2f7c CMP X28, X18 |
(2734) 0x4a2f80 B.LT 4a2ec0 |
(2733) 0x4a2f84 SUB X10, X29, #64 |
(2733) 0x4a2f88 ORR Z28.D, Z29.D, Z29.D |
(2733) 0x4a2f8c ORR Z29.D, Z13.D, Z13.D |
(2733) 0x4a2f90 LDR Z12, [X10, #511, MUL VL] |
(2733) 0x4a2f94 SUB X10, X29, #64 |
(2733) 0x4a2f98 LDR Z27, [X10, #510, MUL VL] |
(2733) 0x4a2f9c SUB X10, X29, #64 |
(2733) 0x4a2fa0 LDR Z26, [X10, #509, MUL VL] |
(2733) 0x4a2fa4 SUB X10, X29, #64 |
(2733) 0x4a2fa8 LDR Z13, [X10, #502, MUL VL] |
(2733) 0x4a2fac SUB X10, X29, #64 |
(2733) 0x4a2fb0 LDR Z9, [X10, #501, MUL VL] |
(2733) 0x4a2fb4 SUB X10, X29, #64 |
(2733) 0x4a2fb8 LDR Z10, [X10, #500, MUL VL] |
(2733) 0x4a2fbc SUB X10, X29, #64 |
(2733) 0x4a2fc0 LDR Z11, [X10, #499, MUL VL] |
(2733) 0x4a2fc4 B 4a2b8c |
0x4a2fc8 SUB X13, X9, #1 |
0x4a2fcc MOVZ W12, #24 |
0x4a2fd0 ADD X1, X8, #8 |
0x4a2fd4 ADD X15, X3, #8 |
0x4a2fd8 ADD X17, X3, #16 |
0x4a2fdc UMULH X12, X13, X12 |
0x4a2fe0 ADD X13, X13, X13,LSL #1 |
0x4a2fe4 UBFM X13, X13, #61, #60 |
0x4a2fe8 ADD X2, X1, X13 |
0x4a2fec CMP XZR, X12 |
0x4a2ff0 ADD X0, X8, X13 |
0x4a2ff4 ADD X16, X15, X13 |
0x4a2ff8 ADD X14, X3, X13 |
0x4a2ffc ADD X18, X17, X13 |
0x4a3000 CSINC W12, WZR, WZR, #0 |
0x4a3004 CMP X2, X1 |
0x4a3008 CCMP X0, X8, #0, #2 |
0x4a300c CCMP X16, X15, #0, #2 |
0x4a3010 CCMP X14, X3, #0, #2 |
0x4a3014 CCMP X18, X17, #0, #2 |
0x4a3018 B.CC 4a2870 |
0x4a301c TBNZ W12, #0, 4a2870 |
0x4a3020 ADD X14, X8, #16 |
0x4a3024 ADD X13, X14, X13 |
0x4a3028 CMP X13, X14 |
0x4a302c B.CC 4a2870 |
0x4a3030 TBNZ W12, #0, 4a2870 |
0x4a3034 ADD X11, X9, X9,LSL #1 |
0x4a3038 UBFM X11, X11, #61, #60 |
0x4a303c ADD X12, X8, X11 |
0x4a3040 CMP X3, X12 |
0x4a3044 B.CS 4a30a4 |
0x4a3048 ADD X11, X3, X11 |
0x4a304c CMP X8, X11 |
0x4a3050 B.CS 4a30a4 |
0x4a3054 ORR X11, XZR, XZR |
0x4a3058 B 4a2870 |
(2732) 0x4a305c LDP X25, X20, [SP, #16] |
(2731) 0x4a3060 ORR X0, XZR, X25 |
(2731) 0x4a3064 BL 46c740 |
(2731) 0x4a3068 ORR X0, XZR, X20 |
(2731) 0x4a306c BL 46c740 |
(2731) 0x4a3070 ADDVL SP, SP, #18 |
(2731) 0x4a3074 ADD SP, SP, #288 |
(2731) 0x4a3078 LDP D9, D8, [SP, #48] |
(2731) 0x4a307c LDP D11, D10, [SP, #32] |
(2731) 0x4a3080 LDP D13, D12, [SP, #16] |
(2731) 0x4a3084 LDP X20, X19, [SP, #144] |
(2731) 0x4a3088 LDP X22, X21, [SP, #128] |
(2731) 0x4a308c LDP X24, X23, [SP, #112] |
(2731) 0x4a3090 LDP X26, X25, [SP, #96] |
(2731) 0x4a3094 LDP X28, X27, [SP, #80] |
(2731) 0x4a3098 LDP X29, X30, [SP, #64] |
(2731) 0x4a309c LDP D15, D14, [SP], #160 |
(2731) 0x4a30a0 RET |
(2731) 0x4a30a4 RDVL X11, #1 |
(2731) 0x4a30a8 ORR X12, XZR, XZR |
(2731) 0x4a30ac UBFM X14, X11, #4, #63 |
(2731) 0x4a30b0 UDIV X11, X9, X10 |
(2731) 0x4a30b4 PTRUE P0.D, ALL |
(2731) 0x4a30b8 ADD X15, X14, X14,LSL #1 |
(2731) 0x4a30bc UBFM X16, X15, #60, #59 |
(2731) 0x4a30c0 UBFM X14, X15, #59, #58 |
(2731) 0x4a30c4 ADD X15, X3, X16 |
(2731) 0x4a30c8 ADD X16, X8, X16 |
(2731) 0x4a30cc MADD X11, X11, X10, XZR |
(2731) 0x4a30d0 SUB X13, X9, X11 |
(2731) 0x4a30d4 ORR X17, XZR, X11 |
(2731) 0x4a30d8 HINT #0 |
(2731) 0x4a30dc HINT #0 |
(2729) 0x4a30e0 ADD X18, X8, X12 |
(2729) 0x4a30e4 ADD X0, X16, X12 |
(2729) 0x4a30e8 LD3D {Z0.D, Z1.D, Z2.D}, P0/Z, [X18, MUL VL] |
(2729) 0x4a30ec LD3D {Z3.D, Z4.D, Z5.D}, P0/Z, [X0, MUL VL] |
(2729) 0x4a30f0 ADD X18, X3, X12 |
(2729) 0x4a30f4 ADD X0, X15, X12 |
(2729) 0x4a30f8 ADD X12, X12, X14 |
(2729) 0x4a30fc SUBS X17, X17, X10 |
(2729) 0x4a3100 ST3D {Z0.D, Z1.D, Z2.D}, P0, [X18, MUL VL] |
(2729) 0x4a3104 ST3D {Z3.D, Z4.D, Z5.D}, P0, [X0, MUL VL] |
(2729) 0x4a3108 B.NE 4a30e0 |
(2731) 0x4a310c CBNZ X13, 4a2870 |
(2731) 0x4a3110 B 4a28b8 |
0x4a3114 BL 40a420 |
0x4a3118 BL 40a420 |
0x4a311c B 4a3128 |
0x4a3120 B 4a3128 |
0x4a3124 B 4a3128 |
0x4a3128 ORR X8, XZR, X20 |
0x4a312c ORR X20, XZR, X0 |
0x4a3130 ORR X0, XZR, X8 |
0x4a3134 BL 46c740 |
0x4a3138 ORR X0, XZR, X20 |
0x4a313c BL 4048e0 |
0x4a3140 BL 40a420 |
0x4a3144 HINT #0 |
0x4a3148 HINT #0 |
0x4a314c HINT #0 |
0x4a3150 HINT #0 |
0x4a3154 HINT #0 |
0x4a3158 HINT #0 |
0x4a315c HINT #0 |
Coverage (%) | Name | Source Location | Module |
---|
Path / |
Source file and lines | SoaDistanceTableABOMPTarget.h:184-233 |
Module | exec |
nb instructions | 96 |
loop length | 384 |
nb stack references | 0 |
front end | 10.88 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 10.00 | 10.00 | 14.25 | 14.25 | 14.25 | 14.25 | 2.00 | 2.00 | 0.50 | 0.50 | 6.00 | 6.00 | 6.00 | 4.00 | 4.00 |
cycles | 10.00 | 10.00 | 14.25 | 14.25 | 14.25 | 14.25 | 2.00 | 2.00 | 0.50 | 0.50 | 6.00 | 6.00 | 6.00 | 4.00 | 4.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 10.88 |
Overall L1 | 14.25 |
all | 10% |
load | NA (no load vectorizable/vectorized instructions) |
store | 100% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP D15, D14, [SP, #864]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D13, D12, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D11, D10, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D9, D8, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP X29, X30, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X28, X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X26, X25, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X24, X23, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X22, X21, [SP, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X20, X19, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X29, SP, #64 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADDVL SP, SP, #46 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB SP, SP, #288 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X21, XZR, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X24, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4a4500 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE6resizeEv> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X20, [X24, #440] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR X0, XZR, X20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 46c620 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDP X23, X27, [X24, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
ADD X0, X24, #384 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X1, X27, X27,LSL #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVI D0, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
BL 43e8c0 <_ZN11qmcplusplus6VectorIdNS_12OMPallocatorIdNS_10MallocatorIdLm32EEEEEE6resizeEmd> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X9, [X24, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
CBZ X9, 4a28b0 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0xd0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CNTW X10, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
LDR X8, [X21, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X3, [X24, #408] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
MOVZ W11, #32 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X10, #32 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CSEL X11, X10, X11, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X9, X11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
ORR X11, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X3, [SP, #208] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
B.CS 4a2fc8 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x7e8> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X8, [X24, #408] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X8, [SP, #208] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
SUB X13, X9, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ W12, #24 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X1, X8, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X15, X3, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X17, X3, #16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UMULH X12, X13, X12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADD X13, X13, X13,LSL #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X13, X13, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X2, X1, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP XZR, X12 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
ADD X0, X8, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X16, X15, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X14, X3, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X18, X17, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CSINC W12, WZR, WZR, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X2, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CCMP X0, X8, #0, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CCMP X16, X15, #0, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CCMP X14, X3, #0, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CCMP X18, X17, #0, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
B.CC 4a2870 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x90> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TBNZ W12, #0, 4a2870 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x90> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X14, X8, #16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X13, X14, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X13, X14 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.CC 4a2870 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x90> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TBNZ W12, #0, 4a2870 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x90> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X11, X9, X9,LSL #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X11, X11, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X12, X8, X11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X3, X12 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.CS 4a30a4 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x8c4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X11, X3, X11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X8, X11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.CS 4a30a4 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x8c4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X11, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
B 4a2870 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x90> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
BL 40a420 <__clang_call_terminate> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
BL 40a420 <__clang_call_terminate> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
B 4a3128 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x948> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
B 4a3128 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x948> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
B 4a3128 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x948> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X8, XZR, X20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X20, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X0, XZR, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 46c740 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X0, XZR, X20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4048e0 <@plt_start@+0x3b0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
BL 40a420 <__clang_call_terminate> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Source file and lines | SoaDistanceTableABOMPTarget.h:184-233 |
Module | exec |
nb instructions | 96 |
loop length | 384 |
nb stack references | 0 |
front end | 10.88 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 10.00 | 10.00 | 14.25 | 14.25 | 14.25 | 14.25 | 2.00 | 2.00 | 0.50 | 0.50 | 6.00 | 6.00 | 6.00 | 4.00 | 4.00 |
cycles | 10.00 | 10.00 | 14.25 | 14.25 | 14.25 | 14.25 | 2.00 | 2.00 | 0.50 | 0.50 | 6.00 | 6.00 | 6.00 | 4.00 | 4.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 10.88 |
Overall L1 | 14.25 |
all | 10% |
load | NA (no load vectorizable/vectorized instructions) |
store | 100% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP D15, D14, [SP, #864]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D13, D12, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D11, D10, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D9, D8, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP X29, X30, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X28, X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X26, X25, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X24, X23, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X22, X21, [SP, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X20, X19, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X29, SP, #64 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADDVL SP, SP, #46 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB SP, SP, #288 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X21, XZR, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X24, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4a4500 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE6resizeEv> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X20, [X24, #440] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR X0, XZR, X20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 46c620 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE5startEv> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDP X23, X27, [X24, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
ADD X0, X24, #384 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X1, X27, X27,LSL #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVI D0, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
BL 43e8c0 <_ZN11qmcplusplus6VectorIdNS_12OMPallocatorIdNS_10MallocatorIdLm32EEEEEE6resizeEmd> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X9, [X24, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
CBZ X9, 4a28b0 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0xd0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CNTW X10, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
LDR X8, [X21, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X3, [X24, #408] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
MOVZ W11, #32 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X10, #32 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CSEL X11, X10, X11, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X9, X11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
ORR X11, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X3, [SP, #208] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
B.CS 4a2fc8 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x7e8> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X8, [X24, #408] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X8, [SP, #208] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
SUB X13, X9, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ W12, #24 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X1, X8, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X15, X3, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X17, X3, #16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UMULH X12, X13, X12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
ADD X13, X13, X13,LSL #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X13, X13, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X2, X1, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP XZR, X12 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
ADD X0, X8, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X16, X15, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X14, X3, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X18, X17, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CSINC W12, WZR, WZR, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X2, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CCMP X0, X8, #0, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CCMP X16, X15, #0, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CCMP X14, X3, #0, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CCMP X18, X17, #0, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
B.CC 4a2870 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x90> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TBNZ W12, #0, 4a2870 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x90> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X14, X8, #16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X13, X14, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X13, X14 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.CC 4a2870 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x90> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TBNZ W12, #0, 4a2870 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x90> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X11, X9, X9,LSL #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X11, X11, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X12, X8, X11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X3, X12 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.CS 4a30a4 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x8c4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X11, X3, X11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X8, X11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.CS 4a30a4 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x8c4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X11, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
B 4a2870 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x90> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
BL 40a420 <__clang_call_terminate> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
BL 40a420 <__clang_call_terminate> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
B 4a3128 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x948> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
B 4a3128 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x948> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
B 4a3128 <_ZN11qmcplusplus27SoaDistanceTableABOMPTargetIdLj3ELi40EE8evaluateERNS_11ParticleSetE+0x948> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X8, XZR, X20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X20, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X0, XZR, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 46c740 <_ZN11qmcplusplus9TimerTypeINSt6chrono3_V212system_clockEE4stopEv> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X0, XZR, X20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4048e0 <@plt_start@+0x3b0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
BL 40a420 <__clang_call_terminate> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼qmcplusplus::SoaDistanceTableABOMPTarget | 4.21 | 6.6 |
▼Loop 2732 - SoaDistanceTableABOMPTarget.h:194-233 - exec– | 0.03 | 0.04 |
▼Loop 2733 - SoaDistanceTableABOMPTarget.h:215-228 - exec– | 0.03 | 0.04 |
○Loop 2735 - ParticleBConds3DSoa.h:280-298 - exec | 4.14 | 5.65 |
○Loop 2734 - SoaDistanceTableABOMPTarget.h:228-228 - exec | 0 | 0 |
▼Loop 2731 - SoaDistanceTableABOMPTarget.h:194-233 - exec– | 0 | 0.01 |
○Loop 2730 - SoaDistanceTableABOMPTarget.h:194-196 - exec | 0 | 0.01 |
○Loop 2729 - SoaDistanceTableABOMPTarget.h:194-196 - exec | 0 | 0 |