Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: libseq_mv.so | Source: csr_matvec.c:243-404 [...] | Coverage: 14.93% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: libseq_mv.so | Source: csr_matvec.c:243-404 [...] | Coverage: 14.93% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-716-5699/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 243 - 404 |
-------------------------------------------------------------------------------- |
243: #pragma omp parallel private(i,jj,tempx) |
244: #endif |
245: { |
246: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
247: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
248: hypre_assert(iBegin <= iEnd); |
249: hypre_assert(iBegin >= 0 && iBegin <= num_rows); |
250: hypre_assert(iEnd >= 0 && iEnd <= num_rows); |
251: |
252: if (0 == temp) |
253: { |
254: if (1 == alpha) // JSP: a common path |
255: { |
256: for (i = iBegin; i < iEnd; i++) |
257: { |
258: tempx = 0.0; |
259: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
260: { |
261: tempx += A_data[jj] * x_data[A_j[jj]]; |
262: } |
263: y_data[i] = tempx; |
264: } |
265: } // y = A*x |
266: else if (-1 == alpha) |
267: { |
268: for (i = iBegin; i < iEnd; i++) |
269: { |
270: tempx = 0.0; |
271: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
272: { |
273: tempx -= A_data[jj] * x_data[A_j[jj]]; |
274: } |
275: y_data[i] = tempx; |
276: } |
277: } // y = -A*x |
278: else |
279: { |
280: for (i = iBegin; i < iEnd; i++) |
281: { |
282: tempx = 0.0; |
283: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
284: { |
285: tempx += A_data[jj] * x_data[A_j[jj]]; |
286: } |
287: y_data[i] = alpha*tempx; |
288: } |
289: } // y = alpha*A*x |
290: } // temp == 0 |
291: else if (-1 == temp) // beta == -alpha |
292: { |
293: if (1 == alpha) // JSP: a common path |
294: { |
295: for (i = iBegin; i < iEnd; i++) |
296: { |
297: tempx = -b_data[i]; |
298: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
299: { |
300: tempx += A_data[jj] * x_data[A_j[jj]]; |
301: } |
302: y_data[i] = tempx; |
303: } |
304: } // y = A*x - y |
305: else if (-1 == alpha) // JSP: a common path |
306: { |
307: for (i = iBegin; i < iEnd; i++) |
308: { |
309: tempx = b_data[i]; |
310: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
311: { |
312: tempx -= A_data[jj] * x_data[A_j[jj]]; |
313: } |
314: y_data[i] = tempx; |
315: } |
316: } // y = -A*x + y |
317: else |
318: { |
319: for (i = iBegin; i < iEnd; i++) |
320: { |
321: tempx = -b_data[i]; |
322: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
323: { |
324: tempx += A_data[jj] * x_data[A_j[jj]]; |
325: } |
326: y_data[i] = alpha*tempx; |
327: } |
328: } // y = alpha*(A*x - y) |
329: } // temp == -1 |
330: else if (1 == temp) |
331: { |
332: if (1 == alpha) // JSP: a common path |
333: { |
334: for (i = iBegin; i < iEnd; i++) |
335: { |
336: tempx = b_data[i]; |
337: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
338: { |
339: tempx += A_data[jj] * x_data[A_j[jj]]; |
340: } |
341: y_data[i] = tempx; |
342: } |
343: } // y = A*x + y |
344: else if (-1 == alpha) |
345: { |
346: for (i = iBegin; i < iEnd; i++) |
347: { |
348: tempx = -b_data[i]; |
349: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
350: { |
351: tempx -= A_data[jj] * x_data[A_j[jj]]; |
352: } |
353: y_data[i] = tempx; |
354: } |
355: } // y = -A*x - y |
356: else |
357: { |
358: for (i = iBegin; i < iEnd; i++) |
359: { |
360: tempx = b_data[i]; |
361: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
362: { |
363: tempx += A_data[jj] * x_data[A_j[jj]]; |
364: } |
365: y_data[i] = alpha*tempx; |
[...] |
371: if (1 == alpha) // JSP: a common path |
372: { |
373: for (i = iBegin; i < iEnd; i++) |
374: { |
375: tempx = b_data[i]*temp; |
376: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
377: { |
378: tempx += A_data[jj] * x_data[A_j[jj]]; |
379: } |
380: y_data[i] = tempx; |
381: } |
382: } // y = A*x + temp*y |
383: else if (-1 == alpha) |
384: { |
385: for (i = iBegin; i < iEnd; i++) |
386: { |
387: tempx = -b_data[i]*temp; |
388: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
389: { |
390: tempx -= A_data[jj] * x_data[A_j[jj]]; |
391: } |
392: y_data[i] = tempx; |
393: } |
394: } // y = -A*x - temp*y |
395: else |
396: { |
397: for (i = iBegin; i < iEnd; i++) |
398: { |
399: tempx = b_data[i]*temp; |
400: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
401: { |
402: tempx += A_data[jj] * x_data[A_j[jj]]; |
403: } |
404: y_data[i] = alpha*tempx; |
/home/eoseret/qaas_runs_CPU_9468/171-716-5699/intel/AMG/build/AMG/AMG/seq_mv/csr_matrix.c: 645 - 674 |
-------------------------------------------------------------------------------- |
645: HYPRE_Int num_nonzerosA = hypre_CSRMatrixNumNonzeros(A); |
646: HYPRE_Int num_rowsA = hypre_CSRMatrixNumRows(A); |
647: HYPRE_Int *A_i = hypre_CSRMatrixI(A); |
648: |
649: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
650: |
651: HYPRE_Int nonzeros_per_thread = (num_nonzerosA + num_threads - 1)/num_threads; |
652: |
653: if (idx <= 0) |
654: { |
655: return 0; |
656: } |
657: else if (idx >= num_threads) |
[...] |
663: return (HYPRE_Int)(hypre_LowerBound(A_i, A_i + num_rowsA, nonzeros_per_thread*idx) - A_i); |
[...] |
669: return hypre_CSRMatrixGetLoadBalancedPartitionBoundary(A, hypre_GetThreadNum()); |
670: } |
671: |
672: HYPRE_Int hypre_CSRMatrixGetLoadBalancedPartitionEnd(hypre_CSRMatrix *A) |
673: { |
674: return hypre_CSRMatrixGetLoadBalancedPartitionBoundary(A, hypre_GetThreadNum() + 1); |
0xa1c0 PUSH %RBP |
0xa1c1 MOV %RSP,%RBP |
0xa1c4 PUSH %R15 |
0xa1c6 PUSH %R14 |
0xa1c8 PUSH %R13 |
0xa1ca PUSH %R12 |
0xa1cc PUSH %RBX |
0xa1cd SUB $0x28,%RSP |
0xa1d1 MOV %R9,%RBX |
0xa1d4 MOV %R8,%R14 |
0xa1d7 MOV %RCX,%R13 |
0xa1da MOV %RDX,-0x30(%RBP) |
0xa1de CALL 3080 <hypre_GetThreadNum@plt> |
0xa1e3 MOV %RAX,%R15 |
0xa1e6 MOV 0x20(%R13),%R12 |
0xa1ea MOV (%R13),%RAX |
0xa1ee MOV %RAX,-0x48(%RBP) |
0xa1f2 MOV 0x10(%R13),%R13 |
0xa1f6 CALL 3170 <hypre_NumActiveThreads@plt> |
0xa1fb MOV %RAX,%RCX |
0xa1fe LEA -0x1(%R12,%RAX,1),%RAX |
0xa203 MOV %RAX,%RDX |
0xa206 OR %RCX,%RDX |
0xa209 SHR $0x20,%RDX |
0xa20d JE a280 |
0xa20f CQTO |
0xa211 IDIV %RCX |
0xa214 DEC %R12 |
0xa217 TEST %R15,%R15 |
0xa21a MOV %RBX,-0x40(%RBP) |
0xa21e JLE a290 |
0xa220 MOV %R13,-0x38(%RBP) |
0xa224 CMP %R15,%RCX |
0xa227 JLE a298 |
0xa229 MOV -0x48(%RBP),%RBX |
0xa22d LEA (%RBX,%R13,8),%RSI |
0xa231 IMUL %R15,%RAX |
0xa235 MOV %RBX,%RDI |
0xa238 MOV %RAX,%RDX |
0xa23b CALL 3140 <hypre_LowerBound@plt> |
0xa240 SUB %RBX,%RAX |
0xa243 MOV -0x40(%RBP),%RBX |
0xa247 SAR $0x3,%RAX |
0xa24b MOV %RAX,-0x38(%RBP) |
0xa24f JMP a298 |
0xa251 NOPW %CS:(%RAX,%RAX,1) |
0xa260 NOPW %CS:(%RAX,%RAX,1) |
0xa26f NOPW %CS:(%RAX,%RAX,1) |
0xa27e XCHG %AX,%AX |
0xa280 XOR %EDX,%EDX |
0xa282 DIV %ECX |
0xa284 DEC %R12 |
0xa287 TEST %R15,%R15 |
0xa28a MOV %RBX,-0x40(%RBP) |
0xa28e JG a220 |
0xa290 MOVQ $0,-0x38(%RBP) |
0xa298 CALL 3080 <hypre_GetThreadNum@plt> |
0xa29d MOV %RAX,%R15 |
0xa2a0 CALL 3170 <hypre_NumActiveThreads@plt> |
0xa2a5 MOV %RAX,%RCX |
0xa2a8 ADD %RAX,%R12 |
0xa2ab MOV %R12,%RAX |
0xa2ae OR %RCX,%RAX |
0xa2b1 SHR $0x20,%RAX |
0xa2b5 JE a300 |
0xa2b7 MOV %R12,%RAX |
0xa2ba CQTO |
0xa2bc IDIV %RCX |
0xa2bf TEST %R15,%R15 |
0xa2c2 MOV -0x38(%RBP),%R12 |
0xa2c6 JS a310 |
0xa2c8 INC %R15 |
0xa2cb CMP %R15,%RCX |
0xa2ce JG a340 |
0xa2d0 CMP %R13,%R12 |
0xa2d3 JG a36e |
0xa2d9 MOV 0x18(%RBP),%R15 |
0xa2dd TEST %R12,%R12 |
0xa2e0 JNS a3ae |
0xa2e6 JMP a3b3 |
0xa2eb NOPW %CS:(%RAX,%RAX,1) |
0xa2fa NOPW (%RAX,%RAX,1) |
0xa300 MOV %R12D,%EAX |
0xa303 XOR %EDX,%EDX |
0xa305 DIV %ECX |
0xa307 TEST %R15,%R15 |
0xa30a MOV -0x38(%RBP),%R12 |
0xa30e JNS a2c8 |
0xa310 XOR %R13D,%R13D |
0xa313 CMP %R13,%R12 |
0xa316 JLE a2d9 |
0xa318 JMP a36e |
0xa31a NOPW %CS:(%RAX,%RAX,1) |
0xa329 NOPW %CS:(%RAX,%RAX,1) |
0xa338 NOPL (%RAX,%RAX,1) |
0xa340 MOV -0x48(%RBP),%RBX |
0xa344 LEA (%RBX,%R13,8),%RSI |
0xa348 IMUL %R15,%RAX |
0xa34c MOV %RBX,%RDI |
0xa34f MOV %RAX,%RDX |
0xa352 CALL 3140 <hypre_LowerBound@plt> |
0xa357 MOV %RAX,%R13 |
0xa35a SUB %RBX,%R13 |
0xa35d MOV -0x40(%RBP),%RBX |
0xa361 SAR $0x3,%R13 |
0xa365 CMP %R13,%R12 |
0xa368 JLE a2d9 |
0xa36e MOV 0xac6b(%RIP),%RAX |
0xa375 MOV (%RAX),%RDI |
0xa378 LEA 0x5fee(%RIP),%RSI |
0xa37f LEA 0x5f8f(%RIP),%RDX |
0xa386 XOR %EAX,%EAX |
0xa388 CALL 31e0 <hypre_fprintf@plt> |
0xa38d LEA 0x5efe(%RIP),%RDI |
0xa394 MOV $0xf8,%ESI |
0xa399 MOV $0x1,%EDX |
0xa39e XOR %ECX,%ECX |
0xa3a0 CALL 3220 <hypre_error_handler@plt> |
0xa3a5 MOV 0x18(%RBP),%R15 |
0xa3a9 TEST %R12,%R12 |
0xa3ac JS a3b3 |
0xa3ae CMP %R15,%R12 |
0xa3b1 JLE a3ea |
0xa3b3 MOV 0xac26(%RIP),%RAX |
0xa3ba MOV (%RAX),%RDI |
0xa3bd LEA 0x5fa9(%RIP),%RSI |
0xa3c4 LEA 0x5f59(%RIP),%RDX |
0xa3cb XOR %EAX,%EAX |
0xa3cd CALL 31e0 <hypre_fprintf@plt> |
0xa3d2 LEA 0x5eb9(%RIP),%RDI |
0xa3d9 MOV $0xf9,%ESI |
0xa3de MOV $0x1,%EDX |
0xa3e3 XOR %ECX,%ECX |
0xa3e5 CALL 3220 <hypre_error_handler@plt> |
0xa3ea VMOVSD 0x38(%RBP),%XMM5 |
0xa3ef TEST %R13,%R13 |
0xa3f2 JS a3f9 |
0xa3f4 CMP %R15,%R13 |
0xa3f7 JLE a435 |
0xa3f9 MOV 0xabe0(%RIP),%RAX |
0xa400 MOV (%RAX),%RDI |
0xa403 LEA 0x5f63(%RIP),%RSI |
0xa40a LEA 0x5f35(%RIP),%RDX |
0xa411 XOR %EAX,%EAX |
0xa413 CALL 31e0 <hypre_fprintf@plt> |
0xa418 LEA 0x5e73(%RIP),%RDI |
0xa41f MOV $0xfa,%ESI |
0xa424 MOV $0x1,%EDX |
0xa429 XOR %ECX,%ECX |
0xa42b CALL 3220 <hypre_error_handler@plt> |
0xa430 VMOVSD 0x38(%RBP),%XMM5 |
0xa435 MOV 0x20(%RBP),%RCX |
0xa439 MOV 0x10(%RBP),%RDX |
0xa43d VMOVSD -0x30(%RBP),%XMM0 |
0xa442 VXORPD %XMM1,%XMM1,%XMM1 |
0xa446 VUCOMISD %XMM1,%XMM5 |
0xa44a JNE a580 |
0xa450 VUCOMISD 0x5bb8(%RIP),%XMM0 |
0xa458 JNE a6c0 |
0xa45e CMP %R13,%R12 |
0xa461 JGE b340 |
0xa467 MOV %R12,%RAX |
0xa46a NOT %RAX |
0xa46d ADD %RAX,%R13 |
0xa470 XOR %ESI,%ESI |
0xa472 JMP a496 |
0xa474 NOPW %CS:(%RAX,%RAX,1) |
(183) 0xa480 MOV 0x30(%RBP),%RAX |
(183) 0xa484 VMOVSD %XMM0,(%RAX,%RDI,8) |
(183) 0xa489 CMP %R13,%RSI |
(183) 0xa48c LEA 0x1(%RSI),%RSI |
(183) 0xa490 JE b340 |
(183) 0xa496 LEA (%R12,%RSI,1),%RDI |
(183) 0xa49a MOV (%RBX,%RDI,8),%R10 |
(183) 0xa49e MOV 0x8(%RBX,%RDI,8),%R8 |
(183) 0xa4a3 VXORPD %XMM0,%XMM0,%XMM0 |
(183) 0xa4a7 MOV %R8,%R11 |
(183) 0xa4aa SUB %R10,%R11 |
(183) 0xa4ad JLE a480 |
(183) 0xa4af MOV %R11,%R9 |
(183) 0xa4b2 AND $-0x4,%R9 |
(183) 0xa4b6 JE a540 |
(183) 0xa4bc MOV %R13,%RBX |
(183) 0xa4bf LEA -0x1(%R9),%R15 |
(183) 0xa4c3 LEA (%R14,%R10,8),%R12 |
(183) 0xa4c7 LEA (%RDX,%R10,8),%R13 |
(183) 0xa4cb VXORPD %XMM0,%XMM0,%XMM0 |
(183) 0xa4cf XOR %EAX,%EAX |
(183) 0xa4d1 NOPW %CS:(%RAX,%RAX,1) |
(185) 0xa4e0 VMOVUPD (%R13,%RAX,8),%YMM1 |
(185) 0xa4e7 KXNORW %K0,%K0,%K1 |
(185) 0xa4eb VXORPD %XMM2,%XMM2,%XMM2 |
(185) 0xa4ef VGATHERQPD (%RCX,%YMM1,8),%YMM2{%K1} |
(185) 0xa4f6 VFMADD231PD (%R12,%RAX,8),%YMM2,%YMM0 |
(185) 0xa4fc ADD $0x4,%RAX |
(185) 0xa500 CMP %R15,%RAX |
(185) 0xa503 JBE a4e0 |
(183) 0xa505 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(183) 0xa50b VADDPD %XMM1,%XMM0,%XMM0 |
(183) 0xa50f VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(183) 0xa514 VADDSD %XMM1,%XMM0,%XMM0 |
(183) 0xa518 CMP %R9,%R11 |
(183) 0xa51b MOV %RBX,%R13 |
(183) 0xa51e MOV -0x40(%RBP),%RBX |
(183) 0xa522 MOV -0x38(%RBP),%R12 |
(183) 0xa526 JE a480 |
(183) 0xa52c JMP a543 |
0xa52e NOPW %CS:(%RAX,%RAX,1) |
0xa53d NOPL (%RAX) |
(183) 0xa540 XOR %R9D,%R9D |
(183) 0xa543 ADD %R10,%R9 |
(183) 0xa546 NOPW %CS:(%RAX,%RAX,1) |
(184) 0xa550 MOV (%RDX,%R9,8),%RAX |
(184) 0xa554 VMOVSD (%RCX,%RAX,8),%XMM1 |
(184) 0xa559 VFMADD231SD (%R14,%R9,8),%XMM1,%XMM0 |
(184) 0xa55f INC %R9 |
(184) 0xa562 CMP %R9,%R8 |
(184) 0xa565 JNE a550 |
(183) 0xa567 JMP a480 |
0xa56c NOPW %CS:(%RAX,%RAX,1) |
0xa57b NOPL (%RAX,%RAX,1) |
0xa580 MOV 0x28(%RBP),%RSI |
0xa584 VUCOMISD 0x5a8c(%RIP),%XMM5 |
0xa58c JNE a800 |
0xa592 VUCOMISD 0x5a76(%RIP),%XMM0 |
0xa59a JNE a940 |
0xa5a0 CMP %R13,%R12 |
0xa5a3 JGE b340 |
0xa5a9 MOV %R12,%RAX |
0xa5ac NOT %RAX |
0xa5af ADD %RAX,%R13 |
0xa5b2 XOR %EDI,%EDI |
0xa5b4 VMOVDDUP 0x5a64(%RIP),%XMM0 |
0xa5bc JMP a5d7 |
0xa5be XCHG %AX,%AX |
(174) 0xa5c0 MOV 0x30(%RBP),%RAX |
(174) 0xa5c4 VMOVSD %XMM1,(%RAX,%R8,8) |
(174) 0xa5ca CMP %R13,%RDI |
(174) 0xa5cd LEA 0x1(%RDI),%RDI |
(174) 0xa5d1 JE b340 |
(174) 0xa5d7 LEA (%R12,%RDI,1),%R8 |
(174) 0xa5db VMOVSD (%RSI,%R8,8),%XMM1 |
(174) 0xa5e1 VXORPD %XMM0,%XMM1,%XMM1 |
(174) 0xa5e5 MOV (%RBX,%R8,8),%R11 |
(174) 0xa5e9 MOV 0x8(%RBX,%R8,8),%R9 |
(174) 0xa5ee MOV %R9,%R15 |
(174) 0xa5f1 SUB %R11,%R15 |
(174) 0xa5f4 JLE a5c0 |
(174) 0xa5f6 MOV %R15,%R10 |
(174) 0xa5f9 AND $-0x4,%R10 |
(174) 0xa5fd JE a680 |
(174) 0xa603 MOV %R13,%RBX |
(174) 0xa606 LEA -0x1(%R10),%R12 |
(174) 0xa60a LEA (%R14,%R11,8),%R13 |
(174) 0xa60e LEA (%RDX,%R11,8),%RSI |
(174) 0xa612 VXORPD %XMM2,%XMM2,%XMM2 |
(174) 0xa616 XOR %EAX,%EAX |
(174) 0xa618 NOPL (%RAX,%RAX,1) |
(176) 0xa620 VMOVUPD (%RSI,%RAX,8),%YMM3 |
(176) 0xa625 KXNORW %K0,%K0,%K1 |
(176) 0xa629 VXORPD %XMM4,%XMM4,%XMM4 |
(176) 0xa62d VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(176) 0xa634 VFMADD231PD (%R13,%RAX,8),%YMM4,%YMM2 |
(176) 0xa63b ADD $0x4,%RAX |
(176) 0xa63f CMP %R12,%RAX |
(176) 0xa642 JBE a620 |
(174) 0xa644 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(174) 0xa64a VADDPD %XMM3,%XMM2,%XMM2 |
(174) 0xa64e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(174) 0xa653 VADDSD %XMM3,%XMM2,%XMM2 |
(174) 0xa657 VADDSD %XMM2,%XMM1,%XMM1 |
(174) 0xa65b CMP %R10,%R15 |
(174) 0xa65e MOV %RBX,%R13 |
(174) 0xa661 MOV -0x40(%RBP),%RBX |
(174) 0xa665 MOV -0x38(%RBP),%R12 |
(174) 0xa669 MOV 0x28(%RBP),%RSI |
(174) 0xa66d JE a5c0 |
(174) 0xa673 JMP a683 |
0xa675 NOPW %CS:(%RAX,%RAX,1) |
(174) 0xa680 XOR %R10D,%R10D |
(174) 0xa683 ADD %R11,%R10 |
(174) 0xa686 NOPW %CS:(%RAX,%RAX,1) |
(175) 0xa690 MOV (%RDX,%R10,8),%RAX |
(175) 0xa694 VMOVSD (%RCX,%RAX,8),%XMM2 |
(175) 0xa699 VFMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(175) 0xa69f INC %R10 |
(175) 0xa6a2 CMP %R10,%R9 |
(175) 0xa6a5 JNE a690 |
(174) 0xa6a7 JMP a5c0 |
0xa6ac NOPW %CS:(%RAX,%RAX,1) |
0xa6bb NOPL (%RAX,%RAX,1) |
0xa6c0 VUCOMISD 0x5950(%RIP),%XMM0 |
0xa6c8 JNE aa80 |
0xa6ce CMP %R13,%R12 |
0xa6d1 JGE b340 |
0xa6d7 MOV %R12,%RAX |
0xa6da NOT %RAX |
0xa6dd ADD %RAX,%R13 |
0xa6e0 XOR %ESI,%ESI |
0xa6e2 JMP a716 |
0xa6e4 NOPW %CS:(%RAX,%RAX,1) |
0xa6f3 NOPW %CS:(%RAX,%RAX,1) |
(180) 0xa700 MOV 0x30(%RBP),%RAX |
(180) 0xa704 VMOVSD %XMM0,(%RAX,%RDI,8) |
(180) 0xa709 CMP %R13,%RSI |
(180) 0xa70c LEA 0x1(%RSI),%RSI |
(180) 0xa710 JE b340 |
(180) 0xa716 LEA (%R12,%RSI,1),%RDI |
(180) 0xa71a MOV (%RBX,%RDI,8),%R10 |
(180) 0xa71e MOV 0x8(%RBX,%RDI,8),%R8 |
(180) 0xa723 VXORPD %XMM0,%XMM0,%XMM0 |
(180) 0xa727 MOV %R8,%R11 |
(180) 0xa72a SUB %R10,%R11 |
(180) 0xa72d JLE a700 |
(180) 0xa72f MOV %R11,%R9 |
(180) 0xa732 AND $-0x4,%R9 |
(180) 0xa736 JE a7c0 |
(180) 0xa73c MOV %R13,%RBX |
(180) 0xa73f LEA -0x1(%R9),%R15 |
(180) 0xa743 LEA (%R14,%R10,8),%R12 |
(180) 0xa747 LEA (%RDX,%R10,8),%R13 |
(180) 0xa74b VXORPD %XMM0,%XMM0,%XMM0 |
(180) 0xa74f XOR %EAX,%EAX |
(180) 0xa751 NOPW %CS:(%RAX,%RAX,1) |
(182) 0xa760 VMOVUPD (%R13,%RAX,8),%YMM1 |
(182) 0xa767 VXORPD %XMM2,%XMM2,%XMM2 |
(182) 0xa76b KXNORW %K0,%K0,%K1 |
(182) 0xa76f VGATHERQPD (%RCX,%YMM1,8),%YMM2{%K1} |
(182) 0xa776 VFNMADD231PD (%R12,%RAX,8),%YMM2,%YMM0 |
(182) 0xa77c ADD $0x4,%RAX |
(182) 0xa780 CMP %R15,%RAX |
(182) 0xa783 JBE a760 |
(180) 0xa785 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(180) 0xa78b VADDPD %XMM1,%XMM0,%XMM0 |
(180) 0xa78f VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(180) 0xa794 VADDSD %XMM1,%XMM0,%XMM0 |
(180) 0xa798 CMP %R9,%R11 |
(180) 0xa79b MOV %RBX,%R13 |
(180) 0xa79e MOV -0x40(%RBP),%RBX |
(180) 0xa7a2 MOV -0x38(%RBP),%R12 |
(180) 0xa7a6 JE a700 |
(180) 0xa7ac JMP a7c3 |
0xa7ae NOPW %CS:(%RAX,%RAX,1) |
0xa7bd NOPL (%RAX) |
(180) 0xa7c0 XOR %R9D,%R9D |
(180) 0xa7c3 ADD %R10,%R9 |
(180) 0xa7c6 NOPW %CS:(%RAX,%RAX,1) |
(181) 0xa7d0 MOV (%RDX,%R9,8),%RAX |
(181) 0xa7d4 VMOVSD (%RCX,%RAX,8),%XMM1 |
(181) 0xa7d9 VFNMADD231SD (%R14,%R9,8),%XMM1,%XMM0 |
(181) 0xa7df INC %R9 |
(181) 0xa7e2 CMP %R9,%R8 |
(181) 0xa7e5 JNE a7d0 |
(180) 0xa7e7 JMP a700 |
0xa7ec NOPW %CS:(%RAX,%RAX,1) |
0xa7fb NOPL (%RAX,%RAX,1) |
0xa800 VUCOMISD 0x5808(%RIP),%XMM5 |
0xa808 JNE abc0 |
0xa80e VUCOMISD 0x57fa(%RIP),%XMM0 |
0xa816 JNE ad00 |
0xa81c CMP %R13,%R12 |
0xa81f JGE b340 |
0xa825 MOV %R12,%RAX |
0xa828 NOT %RAX |
0xa82b ADD %RAX,%R13 |
0xa82e XOR %EDI,%EDI |
0xa830 MOV %R13,-0x30(%RBP) |
0xa834 JMP a857 |
0xa836 NOPW %CS:(%RAX,%RAX,1) |
(165) 0xa840 MOV 0x30(%RBP),%RAX |
(165) 0xa844 VMOVSD %XMM0,(%RAX,%R8,8) |
(165) 0xa84a CMP %R13,%RDI |
(165) 0xa84d LEA 0x1(%RDI),%RDI |
(165) 0xa851 JE b340 |
(165) 0xa857 LEA (%R12,%RDI,1),%R8 |
(165) 0xa85b VMOVSD (%RSI,%R8,8),%XMM0 |
(165) 0xa861 MOV (%RBX,%R8,8),%R11 |
(165) 0xa865 MOV 0x8(%RBX,%R8,8),%R9 |
(165) 0xa86a MOV %R9,%R15 |
(165) 0xa86d SUB %R11,%R15 |
(165) 0xa870 JLE a840 |
(165) 0xa872 MOV %R15,%R10 |
(165) 0xa875 AND $-0x4,%R10 |
(165) 0xa879 JE a900 |
(165) 0xa87f LEA -0x1(%R10),%R12 |
(165) 0xa883 LEA (%R14,%R11,8),%R13 |
(165) 0xa887 LEA (%RDX,%R11,8),%RSI |
(165) 0xa88b VXORPD %XMM1,%XMM1,%XMM1 |
(165) 0xa88f XOR %EAX,%EAX |
(165) 0xa891 NOPW %CS:(%RAX,%RAX,1) |
(167) 0xa8a0 VMOVUPD (%RSI,%RAX,8),%YMM2 |
(167) 0xa8a5 VXORPD %XMM3,%XMM3,%XMM3 |
(167) 0xa8a9 KXNORW %K0,%K0,%K1 |
(167) 0xa8ad VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(167) 0xa8b4 VFMADD231PD (%R13,%RAX,8),%YMM3,%YMM1 |
(167) 0xa8bb ADD $0x4,%RAX |
(167) 0xa8bf CMP %R12,%RAX |
(167) 0xa8c2 JBE a8a0 |
(165) 0xa8c4 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(165) 0xa8ca VADDPD %XMM2,%XMM1,%XMM1 |
(165) 0xa8ce VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(165) 0xa8d3 VADDSD %XMM2,%XMM1,%XMM1 |
(165) 0xa8d7 VADDSD %XMM1,%XMM0,%XMM0 |
(165) 0xa8db CMP %R10,%R15 |
(165) 0xa8de MOV -0x30(%RBP),%R13 |
(165) 0xa8e2 MOV -0x38(%RBP),%R12 |
(165) 0xa8e6 MOV 0x28(%RBP),%RSI |
(165) 0xa8ea JE a840 |
(165) 0xa8f0 JMP a903 |
0xa8f2 NOPW %CS:(%RAX,%RAX,1) |
(165) 0xa900 XOR %R10D,%R10D |
(165) 0xa903 ADD %R11,%R10 |
(165) 0xa906 NOPW %CS:(%RAX,%RAX,1) |
(166) 0xa910 MOV (%RDX,%R10,8),%RAX |
(166) 0xa914 VMOVSD (%RCX,%RAX,8),%XMM1 |
(166) 0xa919 VFMADD231SD (%R14,%R10,8),%XMM1,%XMM0 |
(166) 0xa91f INC %R10 |
(166) 0xa922 CMP %R10,%R9 |
(166) 0xa925 JNE a910 |
(165) 0xa927 JMP a840 |
0xa92c NOPW %CS:(%RAX,%RAX,1) |
0xa93b NOPL (%RAX,%RAX,1) |
0xa940 VUCOMISD 0x56d0(%RIP),%XMM0 |
0xa948 JNE ae40 |
0xa94e CMP %R13,%R12 |
0xa951 JGE b340 |
0xa957 MOV %R12,%RAX |
0xa95a NOT %RAX |
0xa95d ADD %RAX,%R13 |
0xa960 XOR %EDI,%EDI |
0xa962 MOV %R13,-0x30(%RBP) |
0xa966 JMP a997 |
0xa968 NOPW %CS:(%RAX,%RAX,1) |
0xa977 NOPW (%RAX,%RAX,1) |
(171) 0xa980 MOV 0x30(%RBP),%RAX |
(171) 0xa984 VMOVSD %XMM0,(%RAX,%R8,8) |
(171) 0xa98a CMP %R13,%RDI |
(171) 0xa98d LEA 0x1(%RDI),%RDI |
(171) 0xa991 JE b340 |
(171) 0xa997 LEA (%R12,%RDI,1),%R8 |
(171) 0xa99b VMOVSD (%RSI,%R8,8),%XMM0 |
(171) 0xa9a1 MOV (%RBX,%R8,8),%R11 |
(171) 0xa9a5 MOV 0x8(%RBX,%R8,8),%R9 |
(171) 0xa9aa MOV %R9,%R15 |
(171) 0xa9ad SUB %R11,%R15 |
(171) 0xa9b0 JLE a980 |
(171) 0xa9b2 MOV %R15,%R10 |
(171) 0xa9b5 AND $-0x4,%R10 |
(171) 0xa9b9 JE aa40 |
(171) 0xa9bf LEA -0x1(%R10),%R12 |
(171) 0xa9c3 LEA (%R14,%R11,8),%R13 |
(171) 0xa9c7 LEA (%RDX,%R11,8),%RSI |
(171) 0xa9cb VXORPD %XMM1,%XMM1,%XMM1 |
(171) 0xa9cf XOR %EAX,%EAX |
(171) 0xa9d1 NOPW %CS:(%RAX,%RAX,1) |
(173) 0xa9e0 VMOVUPD (%RSI,%RAX,8),%YMM2 |
(173) 0xa9e5 KXNORW %K0,%K0,%K1 |
(173) 0xa9e9 VXORPD %XMM3,%XMM3,%XMM3 |
(173) 0xa9ed VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(173) 0xa9f4 VFNMADD231PD (%R13,%RAX,8),%YMM3,%YMM1 |
(173) 0xa9fb ADD $0x4,%RAX |
(173) 0xa9ff CMP %R12,%RAX |
(173) 0xaa02 JBE a9e0 |
(171) 0xaa04 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(171) 0xaa0a VADDPD %XMM2,%XMM1,%XMM1 |
(171) 0xaa0e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(171) 0xaa13 VADDSD %XMM2,%XMM1,%XMM1 |
(171) 0xaa17 VADDSD %XMM1,%XMM0,%XMM0 |
(171) 0xaa1b CMP %R10,%R15 |
(171) 0xaa1e MOV -0x30(%RBP),%R13 |
(171) 0xaa22 MOV -0x38(%RBP),%R12 |
(171) 0xaa26 MOV 0x28(%RBP),%RSI |
(171) 0xaa2a JE a980 |
(171) 0xaa30 JMP aa43 |
0xaa32 NOPW %CS:(%RAX,%RAX,1) |
(171) 0xaa40 XOR %R10D,%R10D |
(171) 0xaa43 ADD %R11,%R10 |
(171) 0xaa46 NOPW %CS:(%RAX,%RAX,1) |
(172) 0xaa50 MOV (%RDX,%R10,8),%RAX |
(172) 0xaa54 VMOVSD (%RCX,%RAX,8),%XMM1 |
(172) 0xaa59 VFNMADD231SD (%R14,%R10,8),%XMM1,%XMM0 |
(172) 0xaa5f INC %R10 |
(172) 0xaa62 CMP %R10,%R9 |
(172) 0xaa65 JNE aa50 |
(171) 0xaa67 JMP a980 |
0xaa6c NOPW %CS:(%RAX,%RAX,1) |
0xaa7b NOPL (%RAX,%RAX,1) |
0xaa80 CMP %R13,%R12 |
0xaa83 JGE b340 |
0xaa89 MOV %R12,%RAX |
0xaa8c NOT %RAX |
0xaa8f ADD %RAX,%R13 |
0xaa92 XOR %ESI,%ESI |
0xaa94 JMP aada |
0xaa96 NOPW %CS:(%RAX,%RAX,1) |
0xaaa5 NOPW %CS:(%RAX,%RAX,1) |
0xaab4 NOPW %CS:(%RAX,%RAX,1) |
(177) 0xaac0 VMULSD %XMM0,%XMM1,%XMM1 |
(177) 0xaac4 MOV 0x30(%RBP),%RAX |
(177) 0xaac8 VMOVSD %XMM1,(%RAX,%RDI,8) |
(177) 0xaacd CMP %R13,%RSI |
(177) 0xaad0 LEA 0x1(%RSI),%RSI |
(177) 0xaad4 JE b340 |
(177) 0xaada LEA (%R12,%RSI,1),%RDI |
(177) 0xaade MOV (%RBX,%RDI,8),%R10 |
(177) 0xaae2 MOV 0x8(%RBX,%RDI,8),%R8 |
(177) 0xaae7 VXORPD %XMM1,%XMM1,%XMM1 |
(177) 0xaaeb MOV %R8,%R11 |
(177) 0xaaee SUB %R10,%R11 |
(177) 0xaaf1 JLE aac0 |
(177) 0xaaf3 MOV %R11,%R9 |
(177) 0xaaf6 AND $-0x4,%R9 |
(177) 0xaafa JE ab80 |
(177) 0xab00 MOV %R13,%RBX |
(177) 0xab03 LEA -0x1(%R9),%R15 |
(177) 0xab07 LEA (%R14,%R10,8),%R12 |
(177) 0xab0b LEA (%RDX,%R10,8),%R13 |
(177) 0xab0f VXORPD %XMM1,%XMM1,%XMM1 |
(177) 0xab13 XOR %EAX,%EAX |
(177) 0xab15 NOPW %CS:(%RAX,%RAX,1) |
(179) 0xab20 VMOVUPD (%R13,%RAX,8),%YMM2 |
(179) 0xab27 VXORPD %XMM3,%XMM3,%XMM3 |
(179) 0xab2b KXNORW %K0,%K0,%K1 |
(179) 0xab2f VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(179) 0xab36 VFMADD231PD (%R12,%RAX,8),%YMM3,%YMM1 |
(179) 0xab3c ADD $0x4,%RAX |
(179) 0xab40 CMP %R15,%RAX |
(179) 0xab43 JBE ab20 |
(177) 0xab45 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(177) 0xab4b VADDPD %XMM2,%XMM1,%XMM1 |
(177) 0xab4f VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(177) 0xab54 VADDSD %XMM2,%XMM1,%XMM1 |
(177) 0xab58 CMP %R9,%R11 |
(177) 0xab5b MOV %RBX,%R13 |
(177) 0xab5e MOV -0x40(%RBP),%RBX |
(177) 0xab62 MOV -0x38(%RBP),%R12 |
(177) 0xab66 JE aac0 |
(177) 0xab6c JMP ab83 |
0xab6e NOPW %CS:(%RAX,%RAX,1) |
0xab7d NOPL (%RAX) |
(177) 0xab80 XOR %R9D,%R9D |
(177) 0xab83 ADD %R10,%R9 |
(177) 0xab86 NOPW %CS:(%RAX,%RAX,1) |
(178) 0xab90 MOV (%RDX,%R9,8),%RAX |
(178) 0xab94 VMOVSD (%RCX,%RAX,8),%XMM2 |
(178) 0xab99 VFMADD231SD (%R14,%R9,8),%XMM2,%XMM1 |
(178) 0xab9f INC %R9 |
(178) 0xaba2 CMP %R9,%R8 |
(178) 0xaba5 JNE ab90 |
(177) 0xaba7 JMP aac0 |
0xabac NOPW %CS:(%RAX,%RAX,1) |
0xabbb NOPL (%RAX,%RAX,1) |
0xabc0 VUCOMISD 0x5448(%RIP),%XMM0 |
0xabc8 JNE af80 |
0xabce CMP %R13,%R12 |
0xabd1 JGE b340 |
0xabd7 MOV %R12,%RAX |
0xabda NOT %RAX |
0xabdd ADD %RAX,%R13 |
0xabe0 XOR %EDI,%EDI |
0xabe2 MOV %R13,-0x30(%RBP) |
0xabe6 JMP ac17 |
0xabe8 NOPW %CS:(%RAX,%RAX,1) |
0xabf7 NOPW (%RAX,%RAX,1) |
(156) 0xac00 MOV 0x30(%RBP),%RAX |
(156) 0xac04 VMOVSD %XMM0,(%RAX,%R8,8) |
(156) 0xac0a CMP %R13,%RDI |
(156) 0xac0d LEA 0x1(%RDI),%RDI |
(156) 0xac11 JE b340 |
(156) 0xac17 LEA (%R12,%RDI,1),%R8 |
(156) 0xac1b VMULSD (%RSI,%R8,8),%XMM5,%XMM0 |
(156) 0xac21 MOV (%RBX,%R8,8),%R11 |
(156) 0xac25 MOV 0x8(%RBX,%R8,8),%R9 |
(156) 0xac2a MOV %R9,%R15 |
(156) 0xac2d SUB %R11,%R15 |
(156) 0xac30 JLE ac00 |
(156) 0xac32 MOV %R15,%R10 |
(156) 0xac35 AND $-0x4,%R10 |
(156) 0xac39 JE acc0 |
(156) 0xac3f LEA -0x1(%R10),%R12 |
(156) 0xac43 LEA (%R14,%R11,8),%R13 |
(156) 0xac47 LEA (%RDX,%R11,8),%RSI |
(156) 0xac4b VXORPD %XMM1,%XMM1,%XMM1 |
(156) 0xac4f XOR %EAX,%EAX |
(156) 0xac51 NOPW %CS:(%RAX,%RAX,1) |
(158) 0xac60 VMOVUPD (%RSI,%RAX,8),%YMM2 |
(158) 0xac65 KXNORW %K0,%K0,%K1 |
(158) 0xac69 VXORPD %XMM3,%XMM3,%XMM3 |
(158) 0xac6d VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(158) 0xac74 VFMADD231PD (%R13,%RAX,8),%YMM3,%YMM1 |
(158) 0xac7b ADD $0x4,%RAX |
(158) 0xac7f CMP %R12,%RAX |
(158) 0xac82 JBE ac60 |
(156) 0xac84 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(156) 0xac8a VADDPD %XMM2,%XMM1,%XMM1 |
(156) 0xac8e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(156) 0xac93 VADDSD %XMM2,%XMM1,%XMM1 |
(156) 0xac97 VADDSD %XMM1,%XMM0,%XMM0 |
(156) 0xac9b CMP %R10,%R15 |
(156) 0xac9e MOV -0x30(%RBP),%R13 |
(156) 0xaca2 MOV -0x38(%RBP),%R12 |
(156) 0xaca6 MOV 0x28(%RBP),%RSI |
(156) 0xacaa JE ac00 |
(156) 0xacb0 JMP acc3 |
0xacb2 NOPW %CS:(%RAX,%RAX,1) |
(156) 0xacc0 XOR %R10D,%R10D |
(156) 0xacc3 ADD %R11,%R10 |
(156) 0xacc6 NOPW %CS:(%RAX,%RAX,1) |
(157) 0xacd0 MOV (%RDX,%R10,8),%RAX |
(157) 0xacd4 VMOVSD (%RCX,%RAX,8),%XMM1 |
(157) 0xacd9 VFMADD231SD (%R14,%R10,8),%XMM1,%XMM0 |
(157) 0xacdf INC %R10 |
(157) 0xace2 CMP %R10,%R9 |
(157) 0xace5 JNE acd0 |
(156) 0xace7 JMP ac00 |
0xacec NOPW %CS:(%RAX,%RAX,1) |
0xacfb NOPL (%RAX,%RAX,1) |
0xad00 VUCOMISD 0x5310(%RIP),%XMM0 |
0xad08 JNE b0c0 |
0xad0e CMP %R13,%R12 |
0xad11 JGE b340 |
0xad17 MOV %R12,%RAX |
0xad1a NOT %RAX |
0xad1d ADD %RAX,%R13 |
0xad20 XOR %EDI,%EDI |
0xad22 VMOVDDUP 0x52f6(%RIP),%XMM0 |
0xad2a MOV %R13,-0x30(%RBP) |
0xad2e JMP ad57 |
0xad30 NOPW %CS:(%RAX,%RAX,1) |
0xad3f NOP |
(162) 0xad40 MOV 0x30(%RBP),%RAX |
(162) 0xad44 VMOVSD %XMM1,(%RAX,%R8,8) |
(162) 0xad4a CMP %R13,%RDI |
(162) 0xad4d LEA 0x1(%RDI),%RDI |
(162) 0xad51 JE b340 |
(162) 0xad57 LEA (%R12,%RDI,1),%R8 |
(162) 0xad5b VMOVSD (%RSI,%R8,8),%XMM1 |
(162) 0xad61 VXORPD %XMM0,%XMM1,%XMM1 |
(162) 0xad65 MOV (%RBX,%R8,8),%R11 |
(162) 0xad69 MOV 0x8(%RBX,%R8,8),%R9 |
(162) 0xad6e MOV %R9,%R15 |
(162) 0xad71 SUB %R11,%R15 |
(162) 0xad74 JLE ad40 |
(162) 0xad76 MOV %R15,%R10 |
(162) 0xad79 AND $-0x4,%R10 |
(162) 0xad7d JE ae00 |
(162) 0xad83 LEA -0x1(%R10),%R12 |
(162) 0xad87 LEA (%R14,%R11,8),%R13 |
(162) 0xad8b LEA (%RDX,%R11,8),%RSI |
(162) 0xad8f VXORPD %XMM2,%XMM2,%XMM2 |
(162) 0xad93 XOR %EAX,%EAX |
(162) 0xad95 NOPW %CS:(%RAX,%RAX,1) |
(164) 0xada0 VMOVUPD (%RSI,%RAX,8),%YMM3 |
(164) 0xada5 VXORPD %XMM4,%XMM4,%XMM4 |
(164) 0xada9 KXNORW %K0,%K0,%K1 |
(164) 0xadad VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(164) 0xadb4 VFNMADD231PD (%R13,%RAX,8),%YMM4,%YMM2 |
(164) 0xadbb ADD $0x4,%RAX |
(164) 0xadbf CMP %R12,%RAX |
(164) 0xadc2 JBE ada0 |
(162) 0xadc4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(162) 0xadca VADDPD %XMM3,%XMM2,%XMM2 |
(162) 0xadce VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(162) 0xadd3 VADDSD %XMM3,%XMM2,%XMM2 |
(162) 0xadd7 VADDSD %XMM2,%XMM1,%XMM1 |
(162) 0xaddb CMP %R10,%R15 |
(162) 0xadde MOV -0x30(%RBP),%R13 |
(162) 0xade2 MOV -0x38(%RBP),%R12 |
(162) 0xade6 MOV 0x28(%RBP),%RSI |
(162) 0xadea JE ad40 |
(162) 0xadf0 JMP ae03 |
0xadf2 NOPW %CS:(%RAX,%RAX,1) |
(162) 0xae00 XOR %R10D,%R10D |
(162) 0xae03 ADD %R11,%R10 |
(162) 0xae06 NOPW %CS:(%RAX,%RAX,1) |
(163) 0xae10 MOV (%RDX,%R10,8),%RAX |
(163) 0xae14 VMOVSD (%RCX,%RAX,8),%XMM2 |
(163) 0xae19 VFNMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(163) 0xae1f INC %R10 |
(163) 0xae22 CMP %R10,%R9 |
(163) 0xae25 JNE ae10 |
(162) 0xae27 JMP ad40 |
0xae2c NOPW %CS:(%RAX,%RAX,1) |
0xae3b NOPL (%RAX,%RAX,1) |
0xae40 CMP %R13,%R12 |
0xae43 JGE b340 |
0xae49 MOV %R12,%RAX |
0xae4c NOT %RAX |
0xae4f ADD %RAX,%R13 |
0xae52 XOR %EDI,%EDI |
0xae54 VMOVDDUP 0x51c4(%RIP),%XMM1 |
0xae5c MOV %R13,-0x30(%RBP) |
0xae60 JMP ae9b |
0xae62 NOPW %CS:(%RAX,%RAX,1) |
0xae71 NOPW %CS:(%RAX,%RAX,1) |
(168) 0xae80 VMULSD %XMM0,%XMM2,%XMM2 |
(168) 0xae84 MOV 0x30(%RBP),%RAX |
(168) 0xae88 VMOVSD %XMM2,(%RAX,%R8,8) |
(168) 0xae8e CMP %R13,%RDI |
(168) 0xae91 LEA 0x1(%RDI),%RDI |
(168) 0xae95 JE b340 |
(168) 0xae9b LEA (%R12,%RDI,1),%R8 |
(168) 0xae9f VMOVSD (%RSI,%R8,8),%XMM2 |
(168) 0xaea5 VXORPD %XMM1,%XMM2,%XMM2 |
(168) 0xaea9 MOV (%RBX,%R8,8),%R11 |
(168) 0xaead MOV 0x8(%RBX,%R8,8),%R9 |
(168) 0xaeb2 MOV %R9,%R15 |
(168) 0xaeb5 SUB %R11,%R15 |
(168) 0xaeb8 JLE ae80 |
(168) 0xaeba MOV %R15,%R10 |
(168) 0xaebd AND $-0x4,%R10 |
(168) 0xaec1 JE af40 |
(168) 0xaec7 LEA -0x1(%R10),%R12 |
(168) 0xaecb LEA (%R14,%R11,8),%R13 |
(168) 0xaecf LEA (%RDX,%R11,8),%RSI |
(168) 0xaed3 VXORPD %XMM3,%XMM3,%XMM3 |
(168) 0xaed7 XOR %EAX,%EAX |
(168) 0xaed9 NOPL (%RAX) |
(170) 0xaee0 VMOVUPD (%RSI,%RAX,8),%YMM4 |
(170) 0xaee5 VXORPD %XMM5,%XMM5,%XMM5 |
(170) 0xaee9 KXNORW %K0,%K0,%K1 |
(170) 0xaeed VGATHERQPD (%RCX,%YMM4,8),%YMM5{%K1} |
(170) 0xaef4 VFMADD231PD (%R13,%RAX,8),%YMM5,%YMM3 |
(170) 0xaefb ADD $0x4,%RAX |
(170) 0xaeff CMP %R12,%RAX |
(170) 0xaf02 JBE aee0 |
(168) 0xaf04 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(168) 0xaf0a VADDPD %XMM4,%XMM3,%XMM3 |
(168) 0xaf0e VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(168) 0xaf13 VADDSD %XMM4,%XMM3,%XMM3 |
(168) 0xaf17 VADDSD %XMM3,%XMM2,%XMM2 |
(168) 0xaf1b CMP %R10,%R15 |
(168) 0xaf1e MOV -0x30(%RBP),%R13 |
(168) 0xaf22 MOV -0x38(%RBP),%R12 |
(168) 0xaf26 MOV 0x28(%RBP),%RSI |
(168) 0xaf2a JE ae80 |
(168) 0xaf30 JMP af43 |
0xaf32 NOPW %CS:(%RAX,%RAX,1) |
(168) 0xaf40 XOR %R10D,%R10D |
(168) 0xaf43 ADD %R11,%R10 |
(168) 0xaf46 NOPW %CS:(%RAX,%RAX,1) |
(169) 0xaf50 MOV (%RDX,%R10,8),%RAX |
(169) 0xaf54 VMOVSD (%RCX,%RAX,8),%XMM3 |
(169) 0xaf59 VFMADD231SD (%R14,%R10,8),%XMM3,%XMM2 |
(169) 0xaf5f INC %R10 |
(169) 0xaf62 CMP %R10,%R9 |
(169) 0xaf65 JNE af50 |
(168) 0xaf67 JMP ae80 |
0xaf6c NOPW %CS:(%RAX,%RAX,1) |
0xaf7b NOPL (%RAX,%RAX,1) |
0xaf80 VUCOMISD 0x5090(%RIP),%XMM0 |
0xaf88 JNE b200 |
0xaf8e CMP %R13,%R12 |
0xaf91 JGE b340 |
0xaf97 VXORPD 0x507f(%RIP){1to2},%XMM5,%XMM0 |
0xafa1 MOV %R12,%RAX |
0xafa4 NOT %RAX |
0xafa7 ADD %RAX,%R13 |
0xafaa XOR %EDI,%EDI |
0xafac MOV %R13,-0x30(%RBP) |
0xafb0 JMP afd7 |
0xafb2 NOPW %CS:(%RAX,%RAX,1) |
(153) 0xafc0 MOV 0x30(%RBP),%RAX |
(153) 0xafc4 VMOVSD %XMM1,(%RAX,%R8,8) |
(153) 0xafca CMP %R13,%RDI |
(153) 0xafcd LEA 0x1(%RDI),%RDI |
(153) 0xafd1 JE b340 |
(153) 0xafd7 LEA (%R12,%RDI,1),%R8 |
(153) 0xafdb VMULSD (%RSI,%R8,8),%XMM0,%XMM1 |
(153) 0xafe1 MOV (%RBX,%R8,8),%R11 |
(153) 0xafe5 MOV 0x8(%RBX,%R8,8),%R9 |
(153) 0xafea MOV %R9,%R15 |
(153) 0xafed SUB %R11,%R15 |
(153) 0xaff0 JLE afc0 |
(153) 0xaff2 MOV %R15,%R10 |
(153) 0xaff5 AND $-0x4,%R10 |
(153) 0xaff9 JE b080 |
(153) 0xafff LEA -0x1(%R10),%R12 |
(153) 0xb003 LEA (%R14,%R11,8),%R13 |
(153) 0xb007 LEA (%RDX,%R11,8),%RSI |
(153) 0xb00b VXORPD %XMM2,%XMM2,%XMM2 |
(153) 0xb00f XOR %EAX,%EAX |
(153) 0xb011 NOPW %CS:(%RAX,%RAX,1) |
(155) 0xb020 VMOVUPD (%RSI,%RAX,8),%YMM3 |
(155) 0xb025 VXORPD %XMM4,%XMM4,%XMM4 |
(155) 0xb029 KXNORW %K0,%K0,%K1 |
(155) 0xb02d VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(155) 0xb034 VFNMADD231PD (%R13,%RAX,8),%YMM4,%YMM2 |
(155) 0xb03b ADD $0x4,%RAX |
(155) 0xb03f CMP %R12,%RAX |
(155) 0xb042 JBE b020 |
(153) 0xb044 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(153) 0xb04a VADDPD %XMM3,%XMM2,%XMM2 |
(153) 0xb04e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(153) 0xb053 VADDSD %XMM3,%XMM2,%XMM2 |
(153) 0xb057 VADDSD %XMM2,%XMM1,%XMM1 |
(153) 0xb05b CMP %R10,%R15 |
(153) 0xb05e MOV -0x30(%RBP),%R13 |
(153) 0xb062 MOV -0x38(%RBP),%R12 |
(153) 0xb066 MOV 0x28(%RBP),%RSI |
(153) 0xb06a JE afc0 |
(153) 0xb070 JMP b083 |
0xb072 NOPW %CS:(%RAX,%RAX,1) |
(153) 0xb080 XOR %R10D,%R10D |
(153) 0xb083 ADD %R11,%R10 |
(153) 0xb086 NOPW %CS:(%RAX,%RAX,1) |
(154) 0xb090 MOV (%RDX,%R10,8),%RAX |
(154) 0xb094 VMOVSD (%RCX,%RAX,8),%XMM2 |
(154) 0xb099 VFNMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(154) 0xb09f INC %R10 |
(154) 0xb0a2 CMP %R10,%R9 |
(154) 0xb0a5 JNE b090 |
(153) 0xb0a7 JMP afc0 |
0xb0ac NOPW %CS:(%RAX,%RAX,1) |
0xb0bb NOPL (%RAX,%RAX,1) |
0xb0c0 CMP %R13,%R12 |
0xb0c3 JGE b340 |
0xb0c9 MOV %R12,%RAX |
0xb0cc NOT %RAX |
0xb0cf ADD %RAX,%R13 |
0xb0d2 XOR %EDI,%EDI |
0xb0d4 MOV %R13,-0x30(%RBP) |
0xb0d8 JMP b11b |
0xb0da NOPW %CS:(%RAX,%RAX,1) |
0xb0e9 NOPW %CS:(%RAX,%RAX,1) |
0xb0f8 NOPL (%RAX,%RAX,1) |
(159) 0xb100 VMULSD %XMM0,%XMM1,%XMM1 |
(159) 0xb104 MOV 0x30(%RBP),%RAX |
(159) 0xb108 VMOVSD %XMM1,(%RAX,%R8,8) |
(159) 0xb10e CMP %R13,%RDI |
(159) 0xb111 LEA 0x1(%RDI),%RDI |
(159) 0xb115 JE b340 |
(159) 0xb11b LEA (%R12,%RDI,1),%R8 |
(159) 0xb11f VMOVSD (%RSI,%R8,8),%XMM1 |
(159) 0xb125 MOV (%RBX,%R8,8),%R11 |
(159) 0xb129 MOV 0x8(%RBX,%R8,8),%R9 |
(159) 0xb12e MOV %R9,%R15 |
(159) 0xb131 SUB %R11,%R15 |
(159) 0xb134 JLE b100 |
(159) 0xb136 MOV %R15,%R10 |
(159) 0xb139 AND $-0x4,%R10 |
(159) 0xb13d JE b1c0 |
(159) 0xb143 LEA -0x1(%R10),%R12 |
(159) 0xb147 LEA (%R14,%R11,8),%R13 |
(159) 0xb14b LEA (%RDX,%R11,8),%RSI |
(159) 0xb14f VXORPD %XMM2,%XMM2,%XMM2 |
(159) 0xb153 XOR %EAX,%EAX |
(159) 0xb155 NOPW %CS:(%RAX,%RAX,1) |
(161) 0xb160 VMOVUPD (%RSI,%RAX,8),%YMM3 |
(161) 0xb165 KXNORW %K0,%K0,%K1 |
(161) 0xb169 VXORPD %XMM4,%XMM4,%XMM4 |
(161) 0xb16d VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(161) 0xb174 VFMADD231PD (%R13,%RAX,8),%YMM4,%YMM2 |
(161) 0xb17b ADD $0x4,%RAX |
(161) 0xb17f CMP %R12,%RAX |
(161) 0xb182 JBE b160 |
(159) 0xb184 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(159) 0xb18a VADDPD %XMM3,%XMM2,%XMM2 |
(159) 0xb18e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(159) 0xb193 VADDSD %XMM3,%XMM2,%XMM2 |
(159) 0xb197 VADDSD %XMM2,%XMM1,%XMM1 |
(159) 0xb19b CMP %R10,%R15 |
(159) 0xb19e MOV -0x30(%RBP),%R13 |
(159) 0xb1a2 MOV -0x38(%RBP),%R12 |
(159) 0xb1a6 MOV 0x28(%RBP),%RSI |
(159) 0xb1aa JE b100 |
(159) 0xb1b0 JMP b1c3 |
0xb1b2 NOPW %CS:(%RAX,%RAX,1) |
(159) 0xb1c0 XOR %R10D,%R10D |
(159) 0xb1c3 ADD %R11,%R10 |
(159) 0xb1c6 NOPW %CS:(%RAX,%RAX,1) |
(160) 0xb1d0 MOV (%RDX,%R10,8),%RAX |
(160) 0xb1d4 VMOVSD (%RCX,%RAX,8),%XMM2 |
(160) 0xb1d9 VFMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(160) 0xb1df INC %R10 |
(160) 0xb1e2 CMP %R10,%R9 |
(160) 0xb1e5 JNE b1d0 |
(159) 0xb1e7 JMP b100 |
0xb1ec NOPW %CS:(%RAX,%RAX,1) |
0xb1fb NOPL (%RAX,%RAX,1) |
0xb200 CMP %R13,%R12 |
0xb203 JGE b340 |
0xb209 MOV %R12,%RAX |
0xb20c NOT %RAX |
0xb20f ADD %RAX,%R13 |
0xb212 XOR %EDI,%EDI |
0xb214 JMP b25b |
0xb216 NOPW %CS:(%RAX,%RAX,1) |
0xb225 NOPW %CS:(%RAX,%RAX,1) |
0xb234 NOPW %CS:(%RAX,%RAX,1) |
(150) 0xb240 VMULSD %XMM0,%XMM1,%XMM1 |
(150) 0xb244 MOV 0x30(%RBP),%RAX |
(150) 0xb248 VMOVSD %XMM1,(%RAX,%R8,8) |
(150) 0xb24e CMP %R13,%RDI |
(150) 0xb251 LEA 0x1(%RDI),%RDI |
(150) 0xb255 JE b340 |
(150) 0xb25b LEA (%R12,%RDI,1),%R8 |
(150) 0xb25f VMULSD (%RSI,%R8,8),%XMM5,%XMM1 |
(150) 0xb265 MOV (%RBX,%R8,8),%R11 |
(150) 0xb269 MOV 0x8(%RBX,%R8,8),%R9 |
(150) 0xb26e MOV %R9,%R15 |
(150) 0xb271 SUB %R11,%R15 |
(150) 0xb274 JLE b240 |
(150) 0xb276 MOV %R15,%R10 |
(150) 0xb279 AND $-0x4,%R10 |
(150) 0xb27d JE b300 |
(150) 0xb283 MOV %R13,%RAX |
(150) 0xb286 LEA -0x1(%R10),%R12 |
(150) 0xb28a LEA (%R14,%R11,8),%R13 |
(150) 0xb28e MOV %R11,-0x30(%RBP) |
(150) 0xb292 LEA (%RDX,%R11,8),%RSI |
(150) 0xb296 VXORPD %XMM2,%XMM2,%XMM2 |
(150) 0xb29a XOR %R11D,%R11D |
(150) 0xb29d NOPL (%RAX) |
(152) 0xb2a0 VMOVUPD (%RSI,%R11,8),%YMM3 |
(152) 0xb2a6 VXORPD %XMM4,%XMM4,%XMM4 |
(152) 0xb2aa KXNORW %K0,%K0,%K1 |
(152) 0xb2ae VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(152) 0xb2b5 VFMADD231PD (%R13,%R11,8),%YMM4,%YMM2 |
(152) 0xb2bc ADD $0x4,%R11 |
(152) 0xb2c0 CMP %R12,%R11 |
(152) 0xb2c3 JBE b2a0 |
(150) 0xb2c5 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(150) 0xb2cb VADDPD %XMM3,%XMM2,%XMM2 |
(150) 0xb2cf VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(150) 0xb2d4 VADDSD %XMM3,%XMM2,%XMM2 |
(150) 0xb2d8 VADDSD %XMM2,%XMM1,%XMM1 |
(150) 0xb2dc CMP %R10,%R15 |
(150) 0xb2df MOV %RAX,%R13 |
(150) 0xb2e2 MOV -0x38(%RBP),%R12 |
(150) 0xb2e6 MOV 0x28(%RBP),%RSI |
(150) 0xb2ea MOV -0x30(%RBP),%R11 |
(150) 0xb2ee JE b240 |
(150) 0xb2f4 JMP b303 |
0xb2f6 NOPW %CS:(%RAX,%RAX,1) |
(150) 0xb300 XOR %R10D,%R10D |
(150) 0xb303 ADD %R11,%R10 |
(150) 0xb306 NOPW %CS:(%RAX,%RAX,1) |
(151) 0xb310 MOV (%RDX,%R10,8),%RAX |
(151) 0xb314 VMOVSD (%RCX,%RAX,8),%XMM2 |
(151) 0xb319 VFMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(151) 0xb31f INC %R10 |
(151) 0xb322 CMP %R10,%R9 |
(151) 0xb325 JNE b310 |
(150) 0xb327 JMP b240 |
0xb32c NOPW %CS:(%RAX,%RAX,1) |
0xb33b NOPL (%RAX,%RAX,1) |
0xb340 ADD $0x28,%RSP |
0xb344 POP %RBX |
0xb345 POP %R12 |
0xb347 POP %R13 |
0xb349 POP %R14 |
0xb34b POP %R15 |
0xb34d POP %RBP |
0xb34e VZEROUPPER |
0xb351 RET |
0xb352 NOPW %CS:(%RAX,%RAX,1) |
0xb35c NOPL (%RAX) |
Path / |
Source file and lines | csr_matvec.c:243-404 |
Module | libseq_mv.so |
nb instructions | 346 |
nb uops | 383 |
loop length | 1853 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 9 |
micro-operation queue | 63.83 cycles |
front end | 63.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 28.50 | 25.60 | 14.67 | 14.67 | 16.00 | 25.80 | 28.50 | 16.00 | 16.00 | 16.00 | 25.60 | 14.67 |
cycles | 28.50 | 27.20 | 14.67 | 14.67 | 16.00 | 25.80 | 28.50 | 16.00 | 16.00 | 16.00 | 25.60 | 14.67 |
Cycles executing div or sqrt instructions | 32.00 |
FE+BE cycles | 60.87-60.92 |
Stall cycles | 0.00 |
Front-end | 63.83 |
Dispatch | 28.50 |
DIV/SQRT | 32.00 |
Overall L1 | 63.83 |
all | 1% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 1% |
all | 10% |
load | 5% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 4% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 3% |
all | 10% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 13% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R13),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R13),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R12,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE a280 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
DEC %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %RBX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JLE a290 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R15,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE a298 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RBX,%R13,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %R15,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3140 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
SUB %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAR $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP a298 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
DEC %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %RBX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JG a220 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x60> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVQ $0,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE a300 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x140> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x38(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JS a310 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x150> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R15,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JG a340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JG a36e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1ae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x18(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNS a3ae <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP a3b3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1f3> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x38(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNS a2c8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x108> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE a2d9 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x119> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP a36e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1ae> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RBX,%R13,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %R15,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3140 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RBX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAR $0x3,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE a2d9 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x119> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xac6b(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x5fee(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x5f8f(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x5efe(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS a3b3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1f3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE a3ea <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x22a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xac26(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x5fa9(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x5f59(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x5eb9(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R13,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS a3f9 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x239> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE a435 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x275> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xabe0(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x5f63(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x5f35(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x5e73(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD -0x30(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE a580 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x3c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x5bb8(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE a6c0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x500> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP a496 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x2d6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x28(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x5a8c(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE a800 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x640> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x5a76(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE a940 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x780> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x5a64(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP a5d7 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x417> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x5950(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE aa80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP a716 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x556> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x5808(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE abc0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x57fa(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE ad00 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb40> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP a857 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x697> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x56d0(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE ae40 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP a997 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7d7> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP aada <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x91a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x5448(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE af80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdc0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP ac17 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa57> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x5310(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE b0c0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xf00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x52f6(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP ad57 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb97> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x51c4(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP ae9b <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcdb> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x5090(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE b200 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1040> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x507f(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP afd7 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe17> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP b11b <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xf5b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP b25b <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x109b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matvec.c:243-404 |
Module | libseq_mv.so |
nb instructions | 346 |
nb uops | 383 |
loop length | 1853 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 9 |
micro-operation queue | 63.83 cycles |
front end | 63.83 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 28.50 | 25.60 | 14.67 | 14.67 | 16.00 | 25.80 | 28.50 | 16.00 | 16.00 | 16.00 | 25.60 | 14.67 |
cycles | 28.50 | 27.20 | 14.67 | 14.67 | 16.00 | 25.80 | 28.50 | 16.00 | 16.00 | 16.00 | 25.60 | 14.67 |
Cycles executing div or sqrt instructions | 32.00 |
FE+BE cycles | 60.87-60.92 |
Stall cycles | 0.00 |
Front-end | 63.83 |
Dispatch | 28.50 |
DIV/SQRT | 32.00 |
Overall L1 | 63.83 |
all | 1% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 1% |
all | 10% |
load | 5% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 4% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 3% |
all | 10% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 13% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R13),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x10(%R13),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R12,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE a280 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
DEC %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %RBX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JLE a290 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R13,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R15,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE a298 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x48(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RBX,%R13,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %R15,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3140 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
SUB %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAR $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP a298 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
DEC %R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV %RBX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JG a220 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x60> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVQ $0,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE a300 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x140> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x38(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JS a310 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x150> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R15,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JG a340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JG a36e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1ae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x18(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNS a3ae <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1ee> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP a3b3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1f3> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV -0x38(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNS a2c8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x108> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %R13D,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE a2d9 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x119> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP a36e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1ae> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x48(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RBX,%R13,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %R15,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RBX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3140 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RBX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x40(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAR $0x3,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE a2d9 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x119> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xac6b(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x5fee(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x5f8f(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x5efe(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS a3b3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1f3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE a3ea <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x22a> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xac26(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x5fa9(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x5f59(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x5eb9(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R13,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS a3f9 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x239> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE a435 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x275> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xabe0(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x5f63(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x5f35(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x5e73(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD -0x30(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE a580 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x3c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x5bb8(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE a6c0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x500> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP a496 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x2d6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x28(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x5a8c(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE a800 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x640> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x5a76(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE a940 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x780> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x5a64(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP a5d7 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x417> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x5950(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE aa80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8c0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP a716 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x556> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x5808(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE abc0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x57fa(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE ad00 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb40> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP a857 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x697> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x56d0(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE ae40 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc80> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP a997 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7d7> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP aada <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x91a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x5448(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE af80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdc0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP ac17 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa57> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x5310(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE b0c0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xf00> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x52f6(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP ad57 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb97> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x51c4(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP ae9b <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcdb> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x5090(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE b200 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1040> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x507f(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP afd7 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe17> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP b11b <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xf5b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE b340 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1180> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP b25b <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x109b> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace.extracted– | 14.93 | 3.66 |
▼Loop 165 - csr_matvec.c:334-341 - libseq_mv.so– | 1.05 | 0.21 |
○Loop 167 - csr_matvec.c:337-339 - libseq_mv.so | 0.16 | 0.03 |
○Loop 166 - csr_matvec.c:337-339 - libseq_mv.so | 0 | 0 |
▼Loop 171 - csr_matvec.c:307-314 - libseq_mv.so– | 0.77 | 0.15 |
○Loop 173 - csr_matvec.c:310-312 - libseq_mv.so | 5.22 | 1.05 |
○Loop 172 - csr_matvec.c:310-312 - libseq_mv.so | 0.89 | 0.18 |
▼Loop 183 - csr_matvec.c:256-263 - libseq_mv.so– | 0.76 | 0.15 |
○Loop 185 - csr_matvec.c:259-261 - libseq_mv.so | 4.63 | 0.93 |
○Loop 184 - csr_matvec.c:259-261 - libseq_mv.so | 0.84 | 0.17 |
▼Loop 168 - csr_matvec.c:319-326 - libseq_mv.so– | 0 | 0 |
○Loop 169 - csr_matvec.c:322-324 - libseq_mv.so | 0 | 0 |
○Loop 170 - csr_matvec.c:322-324 - libseq_mv.so | 0 | 0 |
▼Loop 150 - csr_matvec.c:397-404 - libseq_mv.so– | 0 | 0 |
○Loop 152 - csr_matvec.c:400-402 - libseq_mv.so | 0 | 0 |
○Loop 151 - csr_matvec.c:400-402 - libseq_mv.so | 0 | 0 |
▼Loop 174 - csr_matvec.c:295-302 - libseq_mv.so– | 0 | 0.01 |
○Loop 176 - csr_matvec.c:298-300 - libseq_mv.so | 0.19 | 0.04 |
○Loop 175 - csr_matvec.c:298-300 - libseq_mv.so | 0.18 | 0.04 |
▼Loop 153 - csr_matvec.c:385-392 - libseq_mv.so– | 0 | 0 |
○Loop 154 - csr_matvec.c:388-390 - libseq_mv.so | 0 | 0 |
○Loop 155 - csr_matvec.c:388-390 - libseq_mv.so | 0 | 0 |
▼Loop 159 - csr_matvec.c:358-365 - libseq_mv.so– | 0 | 0 |
○Loop 161 - csr_matvec.c:361-363 - libseq_mv.so | 0 | 0 |
○Loop 160 - csr_matvec.c:361-363 - libseq_mv.so | 0 | 0 |
▼Loop 180 - csr_matvec.c:268-275 - libseq_mv.so– | 0 | 0 |
○Loop 181 - csr_matvec.c:271-273 - libseq_mv.so | 0 | 0 |
○Loop 182 - csr_matvec.c:271-273 - libseq_mv.so | 0 | 0 |
▼Loop 162 - csr_matvec.c:346-353 - libseq_mv.so– | 0 | 0 |
○Loop 164 - csr_matvec.c:349-351 - libseq_mv.so | 0 | 0 |
○Loop 163 - csr_matvec.c:349-351 - libseq_mv.so | 0 | 0 |
▼Loop 156 - csr_matvec.c:373-380 - libseq_mv.so– | 0 | 0 |
○Loop 158 - csr_matvec.c:376-378 - libseq_mv.so | 0 | 0 |
○Loop 157 - csr_matvec.c:376-378 - libseq_mv.so | 0 | 0 |
▼Loop 177 - csr_matvec.c:280-287 - libseq_mv.so– | 0 | 0 |
○Loop 178 - csr_matvec.c:283-285 - libseq_mv.so | 0 | 0 |
○Loop 179 - csr_matvec.c:283-285 - libseq_mv.so | 0 | 0 |