Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: libseq_mv.so | Source: csr_matvec.c:243-404 [...] | Coverage: 17.95% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: libseq_mv.so | Source: csr_matvec.c:243-404 [...] | Coverage: 17.95% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-147-2675/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 243 - 404 |
-------------------------------------------------------------------------------- |
243: #pragma omp parallel private(i,jj,tempx) |
244: #endif |
245: { |
246: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
247: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
248: hypre_assert(iBegin <= iEnd); |
249: hypre_assert(iBegin >= 0 && iBegin <= num_rows); |
250: hypre_assert(iEnd >= 0 && iEnd <= num_rows); |
251: |
252: if (0 == temp) |
253: { |
254: if (1 == alpha) // JSP: a common path |
255: { |
256: for (i = iBegin; i < iEnd; i++) |
257: { |
258: tempx = 0.0; |
259: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
260: { |
261: tempx += A_data[jj] * x_data[A_j[jj]]; |
262: } |
263: y_data[i] = tempx; |
264: } |
265: } // y = A*x |
266: else if (-1 == alpha) |
267: { |
268: for (i = iBegin; i < iEnd; i++) |
269: { |
270: tempx = 0.0; |
271: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
272: { |
273: tempx -= A_data[jj] * x_data[A_j[jj]]; |
274: } |
275: y_data[i] = tempx; |
276: } |
277: } // y = -A*x |
278: else |
279: { |
280: for (i = iBegin; i < iEnd; i++) |
281: { |
282: tempx = 0.0; |
283: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
284: { |
285: tempx += A_data[jj] * x_data[A_j[jj]]; |
286: } |
287: y_data[i] = alpha*tempx; |
288: } |
289: } // y = alpha*A*x |
290: } // temp == 0 |
291: else if (-1 == temp) // beta == -alpha |
292: { |
293: if (1 == alpha) // JSP: a common path |
294: { |
295: for (i = iBegin; i < iEnd; i++) |
296: { |
297: tempx = -b_data[i]; |
298: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
299: { |
300: tempx += A_data[jj] * x_data[A_j[jj]]; |
301: } |
302: y_data[i] = tempx; |
303: } |
304: } // y = A*x - y |
305: else if (-1 == alpha) // JSP: a common path |
306: { |
307: for (i = iBegin; i < iEnd; i++) |
308: { |
309: tempx = b_data[i]; |
310: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
311: { |
312: tempx -= A_data[jj] * x_data[A_j[jj]]; |
313: } |
314: y_data[i] = tempx; |
315: } |
316: } // y = -A*x + y |
317: else |
318: { |
319: for (i = iBegin; i < iEnd; i++) |
320: { |
321: tempx = -b_data[i]; |
322: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
323: { |
324: tempx += A_data[jj] * x_data[A_j[jj]]; |
325: } |
326: y_data[i] = alpha*tempx; |
327: } |
328: } // y = alpha*(A*x - y) |
329: } // temp == -1 |
330: else if (1 == temp) |
331: { |
332: if (1 == alpha) // JSP: a common path |
333: { |
334: for (i = iBegin; i < iEnd; i++) |
335: { |
336: tempx = b_data[i]; |
337: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
338: { |
339: tempx += A_data[jj] * x_data[A_j[jj]]; |
340: } |
341: y_data[i] = tempx; |
342: } |
343: } // y = A*x + y |
344: else if (-1 == alpha) |
345: { |
346: for (i = iBegin; i < iEnd; i++) |
347: { |
348: tempx = -b_data[i]; |
349: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
350: { |
351: tempx -= A_data[jj] * x_data[A_j[jj]]; |
352: } |
353: y_data[i] = tempx; |
354: } |
355: } // y = -A*x - y |
356: else |
357: { |
358: for (i = iBegin; i < iEnd; i++) |
359: { |
360: tempx = b_data[i]; |
361: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
362: { |
363: tempx += A_data[jj] * x_data[A_j[jj]]; |
364: } |
365: y_data[i] = alpha*tempx; |
[...] |
371: if (1 == alpha) // JSP: a common path |
372: { |
373: for (i = iBegin; i < iEnd; i++) |
374: { |
375: tempx = b_data[i]*temp; |
376: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
377: { |
378: tempx += A_data[jj] * x_data[A_j[jj]]; |
379: } |
380: y_data[i] = tempx; |
381: } |
382: } // y = A*x + temp*y |
383: else if (-1 == alpha) |
384: { |
385: for (i = iBegin; i < iEnd; i++) |
386: { |
387: tempx = -b_data[i]*temp; |
388: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
389: { |
390: tempx -= A_data[jj] * x_data[A_j[jj]]; |
391: } |
392: y_data[i] = tempx; |
393: } |
394: } // y = -A*x - temp*y |
395: else |
396: { |
397: for (i = iBegin; i < iEnd; i++) |
398: { |
399: tempx = b_data[i]*temp; |
400: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
401: { |
402: tempx += A_data[jj] * x_data[A_j[jj]]; |
403: } |
404: y_data[i] = alpha*tempx; |
/home/eoseret/qaas_runs_CPU_9468/171-147-2675/intel/AMG/build/AMG/AMG/seq_mv/csr_matrix.c: 645 - 674 |
-------------------------------------------------------------------------------- |
645: HYPRE_Int num_nonzerosA = hypre_CSRMatrixNumNonzeros(A); |
646: HYPRE_Int num_rowsA = hypre_CSRMatrixNumRows(A); |
647: HYPRE_Int *A_i = hypre_CSRMatrixI(A); |
648: |
649: HYPRE_Int num_threads = hypre_NumActiveThreads(); |
650: |
651: HYPRE_Int nonzeros_per_thread = (num_nonzerosA + num_threads - 1)/num_threads; |
652: |
653: if (idx <= 0) |
654: { |
655: return 0; |
656: } |
657: else if (idx >= num_threads) |
[...] |
663: return (HYPRE_Int)(hypre_LowerBound(A_i, A_i + num_rowsA, nonzeros_per_thread*idx) - A_i); |
[...] |
669: return hypre_CSRMatrixGetLoadBalancedPartitionBoundary(A, hypre_GetThreadNum()); |
670: } |
671: |
672: HYPRE_Int hypre_CSRMatrixGetLoadBalancedPartitionEnd(hypre_CSRMatrix *A) |
673: { |
674: return hypre_CSRMatrixGetLoadBalancedPartitionBoundary(A, hypre_GetThreadNum() + 1); |
0x7ba0 PUSH %RBP |
0x7ba1 MOV %RSP,%RBP |
0x7ba4 PUSH %R15 |
0x7ba6 PUSH %R14 |
0x7ba8 PUSH %R13 |
0x7baa PUSH %R12 |
0x7bac PUSH %RBX |
0x7bad SUB $0x28,%RSP |
0x7bb1 MOV %R9,-0x30(%RBP) |
0x7bb5 MOV %R8,-0x48(%RBP) |
0x7bb9 MOV %RCX,%R15 |
0x7bbc MOV %RDX,%R13 |
0x7bbf CALL 3080 <hypre_GetThreadNum@plt> |
0x7bc4 MOV %RAX,%RBX |
0x7bc7 MOV 0x20(%R15),%R14 |
0x7bcb MOV (%R15),%R12 |
0x7bce MOV 0x10(%R15),%RAX |
0x7bd2 MOV %RAX,-0x40(%RBP) |
0x7bd6 CALL 3170 <hypre_NumActiveThreads@plt> |
0x7bdb MOV %RAX,%RCX |
0x7bde LEA -0x1(%R14,%RAX,1),%RAX |
0x7be3 MOV %RAX,%RDX |
0x7be6 OR %RCX,%RDX |
0x7be9 SHR $0x20,%RDX |
0x7bed JE 7c22 |
0x7bef CQTO |
0x7bf1 IDIV %RCX |
0x7bf4 TEST %RBX,%RBX |
0x7bf7 JLE 7c2b |
0x7bf9 CMP %RBX,%RCX |
0x7bfc JLE 7c33 |
0x7bfe MOV -0x40(%RBP),%RCX |
0x7c02 LEA (%R12,%RCX,8),%RSI |
0x7c06 IMUL %RBX,%RAX |
0x7c0a MOV %R12,%RDI |
0x7c0d MOV %RAX,%RDX |
0x7c10 CALL 3140 <hypre_LowerBound@plt> |
0x7c15 SUB %R12,%RAX |
0x7c18 SAR $0x3,%RAX |
0x7c1c MOV %RAX,-0x40(%RBP) |
0x7c20 JMP 7c33 |
0x7c22 XOR %EDX,%EDX |
0x7c24 DIV %ECX |
0x7c26 TEST %RBX,%RBX |
0x7c29 JG 7bf9 |
0x7c2b MOVQ $0,-0x40(%RBP) |
0x7c33 CALL 3080 <hypre_GetThreadNum@plt> |
0x7c38 MOV %RAX,%RBX |
0x7c3b MOV 0x20(%R15),%R14 |
0x7c3f MOV (%R15),%R12 |
0x7c42 MOV 0x10(%R15),%R15 |
0x7c46 CALL 3170 <hypre_NumActiveThreads@plt> |
0x7c4b MOV %RAX,%RCX |
0x7c4e LEA -0x1(%R14,%RAX,1),%RAX |
0x7c53 MOV %RAX,%RDX |
0x7c56 OR %RCX,%RDX |
0x7c59 SHR $0x20,%RDX |
0x7c5d JE 7c66 |
0x7c5f CQTO |
0x7c61 IDIV %RCX |
0x7c64 JMP 7c6a |
0x7c66 XOR %EDX,%EDX |
0x7c68 DIV %ECX |
0x7c6a MOV -0x40(%RBP),%R14 |
0x7c6e TEST %RBX,%RBX |
0x7c71 JS 7e9d |
0x7c77 INC %RBX |
0x7c7a CMP %RBX,%RCX |
0x7c7d JLE 7c9c |
0x7c7f LEA (%R12,%R15,8),%RSI |
0x7c83 IMUL %RBX,%RAX |
0x7c87 MOV %R12,%RDI |
0x7c8a MOV %RAX,%RDX |
0x7c8d CALL 3140 <hypre_LowerBound@plt> |
0x7c92 MOV %RAX,%R15 |
0x7c95 SUB %R12,%R15 |
0x7c98 SAR $0x3,%R15 |
0x7c9c CMP %R15,%R14 |
0x7c9f JLE 7cd8 |
0x7ca1 MOV 0x9338(%RIP),%RAX |
0x7ca8 MOV (%RAX),%RDI |
0x7cab LEA 0x46bb(%RIP),%RSI |
0x7cb2 LEA 0x465c(%RIP),%RDX |
0x7cb9 XOR %EAX,%EAX |
0x7cbb CALL 31e0 <hypre_fprintf@plt> |
0x7cc0 LEA 0x45cb(%RIP),%RDI |
0x7cc7 MOV $0xf8,%ESI |
0x7ccc MOV $0x1,%EDX |
0x7cd1 XOR %ECX,%ECX |
0x7cd3 CALL 3220 <hypre_error_handler@plt> |
0x7cd8 MOV 0x18(%RBP),%RBX |
0x7cdc TEST %R14,%R14 |
0x7cdf JS 7ce6 |
0x7ce1 CMP %RBX,%R14 |
0x7ce4 JLE 7d1d |
0x7ce6 MOV 0x92f3(%RIP),%RAX |
0x7ced MOV (%RAX),%RDI |
0x7cf0 LEA 0x4676(%RIP),%RSI |
0x7cf7 LEA 0x4626(%RIP),%RDX |
0x7cfe XOR %EAX,%EAX |
0x7d00 CALL 31e0 <hypre_fprintf@plt> |
0x7d05 LEA 0x4586(%RIP),%RDI |
0x7d0c MOV $0xf9,%ESI |
0x7d11 MOV $0x1,%EDX |
0x7d16 XOR %ECX,%ECX |
0x7d18 CALL 3220 <hypre_error_handler@plt> |
0x7d1d VMOVSD 0x38(%RBP),%XMM5 |
0x7d22 TEST %R15,%R15 |
0x7d25 JS 7d2c |
0x7d27 CMP %RBX,%R15 |
0x7d2a JLE 7d68 |
0x7d2c MOV 0x92ad(%RIP),%RAX |
0x7d33 MOV (%RAX),%RDI |
0x7d36 LEA 0x4630(%RIP),%RSI |
0x7d3d LEA 0x4602(%RIP),%RDX |
0x7d44 XOR %EAX,%EAX |
0x7d46 CALL 31e0 <hypre_fprintf@plt> |
0x7d4b LEA 0x4540(%RIP),%RDI |
0x7d52 MOV $0xfa,%ESI |
0x7d57 MOV $0x1,%EDX |
0x7d5c XOR %ECX,%ECX |
0x7d5e CALL 3220 <hypre_error_handler@plt> |
0x7d63 VMOVSD 0x38(%RBP),%XMM5 |
0x7d68 MOV 0x30(%RBP),%RSI |
0x7d6c VMOVQ %R13,%XMM0 |
0x7d71 VXORPD %XMM1,%XMM1,%XMM1 |
0x7d75 VUCOMISD %XMM1,%XMM5 |
0x7d79 JNE 7eae |
0x7d7f VUCOMISD 0x4289(%RIP),%XMM0 |
0x7d87 JNE 7fec |
0x7d8d CMP %R15,%R14 |
0x7d90 JGE 8b5c |
0x7d96 MOV -0x30(%RBP),%RAX |
0x7d9a MOV (%RAX),%RDX |
0x7d9d MOV (%RSI),%RSI |
0x7da0 MOV %R14,%RAX |
0x7da3 NOT %RAX |
0x7da6 ADD %RAX,%R15 |
0x7da9 XOR %EDI,%EDI |
0x7dab MOV %R15,-0x30(%RBP) |
0x7daf MOV %RSI,-0x38(%RBP) |
0x7db3 JMP 7dd6 |
0x7db5 NOPW %CS:(%RAX,%RAX,1) |
(159) 0x7dc0 VMOVSD %XMM0,(%RSI,%R8,8) |
(159) 0x7dc6 LEA 0x1(%RDI),%RAX |
(159) 0x7dca CMP %R15,%RDI |
(159) 0x7dcd MOV %RAX,%RDI |
(159) 0x7dd0 JE 8b5c |
(159) 0x7dd6 LEA (%R14,%RDI,1),%R8 |
(159) 0x7dda MOV (%RDX,%R8,8),%R13 |
(159) 0x7dde MOV 0x8(%RDX,%R8,8),%R9 |
(159) 0x7de3 VXORPD %XMM0,%XMM0,%XMM0 |
(159) 0x7de7 MOV %R9,%RAX |
(159) 0x7dea SUB %R13,%RAX |
(159) 0x7ded JLE 7dc0 |
(159) 0x7def MOV -0x48(%RBP),%RCX |
(159) 0x7df3 MOV (%RCX),%R10 |
(159) 0x7df6 MOV 0x20(%RBP),%RCX |
(159) 0x7dfa MOV (%RCX),%R11 |
(159) 0x7dfd MOV 0x10(%RBP),%RCX |
(159) 0x7e01 MOV (%RCX),%RBX |
(159) 0x7e04 MOV %RAX,%R12 |
(159) 0x7e07 AND $-0x4,%R12 |
(159) 0x7e0b JE 7e6e |
(159) 0x7e0d LEA -0x1(%R12),%RCX |
(159) 0x7e12 LEA (%R10,%R13,8),%R14 |
(159) 0x7e16 LEA (%RBX,%R13,8),%R15 |
(159) 0x7e1a VXORPD %XMM0,%XMM0,%XMM0 |
(159) 0x7e1e XOR %ESI,%ESI |
(161) 0x7e20 VMOVUPD (%R15,%RSI,8),%YMM1 |
(161) 0x7e26 VXORPD %XMM2,%XMM2,%XMM2 |
(161) 0x7e2a KXNORW %K0,%K0,%K1 |
(161) 0x7e2e VGATHERQPD (%R11,%YMM1,8),%YMM2{%K1} |
(161) 0x7e35 VFMADD231PD (%R14,%RSI,8),%YMM2,%YMM0 |
(161) 0x7e3b ADD $0x4,%RSI |
(161) 0x7e3f CMP %RCX,%RSI |
(161) 0x7e42 JBE 7e20 |
(159) 0x7e44 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(159) 0x7e4a VADDPD %XMM1,%XMM0,%XMM0 |
(159) 0x7e4e VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(159) 0x7e53 VADDSD %XMM1,%XMM0,%XMM0 |
(159) 0x7e57 CMP %R12,%RAX |
(159) 0x7e5a MOV -0x40(%RBP),%R14 |
(159) 0x7e5e MOV -0x30(%RBP),%R15 |
(159) 0x7e62 MOV -0x38(%RBP),%RSI |
(159) 0x7e66 JE 7dc0 |
(159) 0x7e6c JMP 7e71 |
(159) 0x7e6e XOR %R12D,%R12D |
(159) 0x7e71 ADD %R13,%R12 |
(159) 0x7e74 NOPW %CS:(%RAX,%RAX,1) |
(160) 0x7e80 MOV (%RBX,%R12,8),%RAX |
(160) 0x7e84 VMOVSD (%R11,%RAX,8),%XMM1 |
(160) 0x7e8a VFMADD231SD (%R10,%R12,8),%XMM1,%XMM0 |
(160) 0x7e90 INC %R12 |
(160) 0x7e93 CMP %R12,%R9 |
(160) 0x7e96 JNE 7e80 |
(159) 0x7e98 JMP 7dc0 |
0x7e9d XOR %R15D,%R15D |
0x7ea0 CMP %R15,%R14 |
0x7ea3 JG 7ca1 |
0x7ea9 JMP 7cd8 |
0x7eae MOV 0x28(%RBP),%RCX |
0x7eb2 VUCOMISD 0x415e(%RIP),%XMM5 |
0x7eba JNE 810d |
0x7ec0 VUCOMISD 0x4148(%RIP),%XMM0 |
0x7ec8 JNE 824c |
0x7ece CMP %R15,%R14 |
0x7ed1 JGE 8b5c |
0x7ed7 MOV -0x30(%RBP),%RAX |
0x7edb MOV (%RAX),%RDI |
0x7ede MOV (%RSI),%RSI |
0x7ee1 MOV %R14,%RAX |
0x7ee4 NOT %RAX |
0x7ee7 ADD %RAX,%R15 |
0x7eea XOR %R8D,%R8D |
0x7eed VMOVDDUP 0x412b(%RIP),%XMM0 |
0x7ef5 MOV %R15,-0x30(%RBP) |
0x7ef9 MOV %RSI,-0x38(%RBP) |
0x7efd JMP 7f16 |
0x7eff NOP |
(150) 0x7f00 VMOVSD %XMM1,(%RSI,%R9,8) |
(150) 0x7f06 LEA 0x1(%R8),%RAX |
(150) 0x7f0a CMP %R15,%R8 |
(150) 0x7f0d MOV %RAX,%R8 |
(150) 0x7f10 JE 8b5c |
(150) 0x7f16 LEA (%R14,%R8,1),%R9 |
(150) 0x7f1a VMOVSD (%RCX,%R9,8),%XMM1 |
(150) 0x7f20 VXORPD %XMM0,%XMM1,%XMM1 |
(150) 0x7f24 MOV (%RDI,%R9,8),%RDX |
(150) 0x7f28 MOV 0x8(%RDI,%R9,8),%R10 |
(150) 0x7f2d MOV %R10,%RAX |
(150) 0x7f30 SUB %RDX,%RAX |
(150) 0x7f33 JLE 7f00 |
(150) 0x7f35 MOV -0x48(%RBP),%RCX |
(150) 0x7f39 MOV (%RCX),%R11 |
(150) 0x7f3c MOV 0x20(%RBP),%RCX |
(150) 0x7f40 MOV (%RCX),%RBX |
(150) 0x7f43 MOV 0x10(%RBP),%RCX |
(150) 0x7f47 MOV (%RCX),%R12 |
(150) 0x7f4a MOV %RAX,%R13 |
(150) 0x7f4d AND $-0x4,%R13 |
(150) 0x7f51 JE 7fc6 |
(150) 0x7f53 LEA -0x1(%R13),%RCX |
(150) 0x7f57 LEA (%R11,%RDX,8),%R14 |
(150) 0x7f5b LEA (%R12,%RDX,8),%R15 |
(150) 0x7f5f VXORPD %XMM2,%XMM2,%XMM2 |
(150) 0x7f63 XOR %ESI,%ESI |
(150) 0x7f65 NOPW %CS:(%RAX,%RAX,1) |
(152) 0x7f70 VMOVUPD (%R15,%RSI,8),%YMM3 |
(152) 0x7f76 VXORPD %XMM4,%XMM4,%XMM4 |
(152) 0x7f7a KXNORW %K0,%K0,%K1 |
(152) 0x7f7e VGATHERQPD (%RBX,%YMM3,8),%YMM4{%K1} |
(152) 0x7f85 VFMADD231PD (%R14,%RSI,8),%YMM4,%YMM2 |
(152) 0x7f8b ADD $0x4,%RSI |
(152) 0x7f8f CMP %RCX,%RSI |
(152) 0x7f92 JBE 7f70 |
(150) 0x7f94 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(150) 0x7f9a VADDPD %XMM3,%XMM2,%XMM2 |
(150) 0x7f9e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(150) 0x7fa3 VADDSD %XMM3,%XMM2,%XMM2 |
(150) 0x7fa7 VADDSD %XMM2,%XMM1,%XMM1 |
(150) 0x7fab CMP %R13,%RAX |
(150) 0x7fae MOV -0x40(%RBP),%R14 |
(150) 0x7fb2 MOV -0x30(%RBP),%R15 |
(150) 0x7fb6 MOV 0x28(%RBP),%RCX |
(150) 0x7fba MOV -0x38(%RBP),%RSI |
(150) 0x7fbe JE 7f00 |
(150) 0x7fc4 JMP 7fcd |
(150) 0x7fc6 XOR %R13D,%R13D |
(150) 0x7fc9 MOV 0x28(%RBP),%RCX |
(150) 0x7fcd ADD %RDX,%R13 |
(151) 0x7fd0 MOV (%R12,%R13,8),%RAX |
(151) 0x7fd4 VMOVSD (%RBX,%RAX,8),%XMM2 |
(151) 0x7fd9 VFMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(151) 0x7fdf INC %R13 |
(151) 0x7fe2 CMP %R13,%R10 |
(151) 0x7fe5 JNE 7fd0 |
(150) 0x7fe7 JMP 7f00 |
0x7fec VUCOMISD 0x4024(%RIP),%XMM0 |
0x7ff4 JNE 837c |
0x7ffa CMP %R15,%R14 |
0x7ffd JGE 8b5c |
0x8003 MOV -0x30(%RBP),%RAX |
0x8007 MOV (%RAX),%RDX |
0x800a MOV (%RSI),%RSI |
0x800d MOV %R14,%RAX |
0x8010 NOT %RAX |
0x8013 ADD %RAX,%R15 |
0x8016 XOR %EDI,%EDI |
0x8018 MOV %R15,-0x30(%RBP) |
0x801c MOV %RSI,-0x38(%RBP) |
0x8020 JMP 8046 |
0x8022 NOPW %CS:(%RAX,%RAX,1) |
(156) 0x8030 VMOVSD %XMM0,(%RSI,%R8,8) |
(156) 0x8036 LEA 0x1(%RDI),%RAX |
(156) 0x803a CMP %R15,%RDI |
(156) 0x803d MOV %RAX,%RDI |
(156) 0x8040 JE 8b5c |
(156) 0x8046 LEA (%R14,%RDI,1),%R8 |
(156) 0x804a MOV (%RDX,%R8,8),%R13 |
(156) 0x804e MOV 0x8(%RDX,%R8,8),%R9 |
(156) 0x8053 VXORPD %XMM0,%XMM0,%XMM0 |
(156) 0x8057 MOV %R9,%RAX |
(156) 0x805a SUB %R13,%RAX |
(156) 0x805d JLE 8030 |
(156) 0x805f MOV -0x48(%RBP),%RCX |
(156) 0x8063 MOV (%RCX),%R10 |
(156) 0x8066 MOV 0x20(%RBP),%RCX |
(156) 0x806a MOV (%RCX),%R11 |
(156) 0x806d MOV 0x10(%RBP),%RCX |
(156) 0x8071 MOV (%RCX),%RBX |
(156) 0x8074 MOV %RAX,%R12 |
(156) 0x8077 AND $-0x4,%R12 |
(156) 0x807b JE 80de |
(156) 0x807d LEA -0x1(%R12),%RCX |
(156) 0x8082 LEA (%R10,%R13,8),%R14 |
(156) 0x8086 LEA (%RBX,%R13,8),%R15 |
(156) 0x808a VXORPD %XMM0,%XMM0,%XMM0 |
(156) 0x808e XOR %ESI,%ESI |
(158) 0x8090 VMOVUPD (%R15,%RSI,8),%YMM1 |
(158) 0x8096 KXNORW %K0,%K0,%K1 |
(158) 0x809a VXORPD %XMM2,%XMM2,%XMM2 |
(158) 0x809e VGATHERQPD (%R11,%YMM1,8),%YMM2{%K1} |
(158) 0x80a5 VFNMADD231PD (%R14,%RSI,8),%YMM2,%YMM0 |
(158) 0x80ab ADD $0x4,%RSI |
(158) 0x80af CMP %RCX,%RSI |
(158) 0x80b2 JBE 8090 |
(156) 0x80b4 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(156) 0x80ba VADDPD %XMM1,%XMM0,%XMM0 |
(156) 0x80be VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(156) 0x80c3 VADDSD %XMM1,%XMM0,%XMM0 |
(156) 0x80c7 CMP %R12,%RAX |
(156) 0x80ca MOV -0x40(%RBP),%R14 |
(156) 0x80ce MOV -0x30(%RBP),%R15 |
(156) 0x80d2 MOV -0x38(%RBP),%RSI |
(156) 0x80d6 JE 8030 |
(156) 0x80dc JMP 80e1 |
(156) 0x80de XOR %R12D,%R12D |
(156) 0x80e1 ADD %R13,%R12 |
(156) 0x80e4 NOPW %CS:(%RAX,%RAX,1) |
(157) 0x80f0 MOV (%RBX,%R12,8),%RAX |
(157) 0x80f4 VMOVSD (%R11,%RAX,8),%XMM1 |
(157) 0x80fa VFNMADD231SD (%R10,%R12,8),%XMM1,%XMM0 |
(157) 0x8100 INC %R12 |
(157) 0x8103 CMP %R12,%R9 |
(157) 0x8106 JNE 80f0 |
(156) 0x8108 JMP 8030 |
0x810d VUCOMISD 0x3efb(%RIP),%XMM5 |
0x8115 JNE 849d |
0x811b VUCOMISD 0x3eed(%RIP),%XMM0 |
0x8123 JNE 85cc |
0x8129 CMP %R15,%R14 |
0x812c JGE 8b5c |
0x8132 MOV -0x30(%RBP),%RAX |
0x8136 MOV (%RAX),%RDI |
0x8139 MOV (%RSI),%RSI |
0x813c MOV %R14,%RAX |
0x813f NOT %RAX |
0x8142 ADD %RAX,%R15 |
0x8145 XOR %R8D,%R8D |
0x8148 MOV %R15,-0x30(%RBP) |
0x814c MOV %RSI,-0x38(%RBP) |
0x8150 JMP 8176 |
0x8152 NOPW %CS:(%RAX,%RAX,1) |
(141) 0x8160 VMOVSD %XMM0,(%RSI,%R9,8) |
(141) 0x8166 LEA 0x1(%R8),%RAX |
(141) 0x816a CMP %R15,%R8 |
(141) 0x816d MOV %RAX,%R8 |
(141) 0x8170 JE 8b5c |
(141) 0x8176 LEA (%R14,%R8,1),%R9 |
(141) 0x817a VMOVSD (%RCX,%R9,8),%XMM0 |
(141) 0x8180 MOV (%RDI,%R9,8),%RDX |
(141) 0x8184 MOV 0x8(%RDI,%R9,8),%R10 |
(141) 0x8189 MOV %R10,%RAX |
(141) 0x818c SUB %RDX,%RAX |
(141) 0x818f JLE 8160 |
(141) 0x8191 MOV -0x48(%RBP),%RCX |
(141) 0x8195 MOV (%RCX),%R11 |
(141) 0x8198 MOV 0x20(%RBP),%RCX |
(141) 0x819c MOV (%RCX),%RBX |
(141) 0x819f MOV 0x10(%RBP),%RCX |
(141) 0x81a3 MOV (%RCX),%R12 |
(141) 0x81a6 MOV %RAX,%R13 |
(141) 0x81a9 AND $-0x4,%R13 |
(141) 0x81ad JE 8226 |
(141) 0x81af LEA -0x1(%R13),%RCX |
(141) 0x81b3 LEA (%R11,%RDX,8),%RSI |
(141) 0x81b7 LEA (%R12,%RDX,8),%R14 |
(141) 0x81bb VXORPD %XMM1,%XMM1,%XMM1 |
(141) 0x81bf XOR %R15D,%R15D |
(141) 0x81c2 NOPW %CS:(%RAX,%RAX,1) |
(143) 0x81d0 VMOVUPD (%R14,%R15,8),%YMM2 |
(143) 0x81d6 KXNORW %K0,%K0,%K1 |
(143) 0x81da VXORPD %XMM3,%XMM3,%XMM3 |
(143) 0x81de VGATHERQPD (%RBX,%YMM2,8),%YMM3{%K1} |
(143) 0x81e5 VFMADD231PD (%RSI,%R15,8),%YMM3,%YMM1 |
(143) 0x81eb ADD $0x4,%R15 |
(143) 0x81ef CMP %RCX,%R15 |
(143) 0x81f2 JBE 81d0 |
(141) 0x81f4 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(141) 0x81fa VADDPD %XMM2,%XMM1,%XMM1 |
(141) 0x81fe VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(141) 0x8203 VADDSD %XMM2,%XMM1,%XMM1 |
(141) 0x8207 VADDSD %XMM1,%XMM0,%XMM0 |
(141) 0x820b CMP %R13,%RAX |
(141) 0x820e MOV -0x40(%RBP),%R14 |
(141) 0x8212 MOV -0x30(%RBP),%R15 |
(141) 0x8216 MOV 0x28(%RBP),%RCX |
(141) 0x821a MOV -0x38(%RBP),%RSI |
(141) 0x821e JE 8160 |
(141) 0x8224 JMP 822d |
(141) 0x8226 XOR %R13D,%R13D |
(141) 0x8229 MOV 0x28(%RBP),%RCX |
(141) 0x822d ADD %RDX,%R13 |
(142) 0x8230 MOV (%R12,%R13,8),%RAX |
(142) 0x8234 VMOVSD (%RBX,%RAX,8),%XMM1 |
(142) 0x8239 VFMADD231SD (%R11,%R13,8),%XMM1,%XMM0 |
(142) 0x823f INC %R13 |
(142) 0x8242 CMP %R13,%R10 |
(142) 0x8245 JNE 8230 |
(141) 0x8247 JMP 8160 |
0x824c VUCOMISD 0x3dc4(%RIP),%XMM0 |
0x8254 JNE 86fc |
0x825a CMP %R15,%R14 |
0x825d JGE 8b5c |
0x8263 MOV -0x30(%RBP),%RAX |
0x8267 MOV (%RAX),%RDI |
0x826a MOV (%RSI),%RSI |
0x826d MOV %R14,%RAX |
0x8270 NOT %RAX |
0x8273 ADD %RAX,%R15 |
0x8276 XOR %R8D,%R8D |
0x8279 MOV %R15,-0x30(%RBP) |
0x827d MOV %RSI,-0x38(%RBP) |
0x8281 JMP 82a6 |
0x8283 NOPW %CS:(%RAX,%RAX,1) |
(147) 0x8290 VMOVSD %XMM0,(%RSI,%R9,8) |
(147) 0x8296 LEA 0x1(%R8),%RAX |
(147) 0x829a CMP %R15,%R8 |
(147) 0x829d MOV %RAX,%R8 |
(147) 0x82a0 JE 8b5c |
(147) 0x82a6 LEA (%R14,%R8,1),%R9 |
(147) 0x82aa VMOVSD (%RCX,%R9,8),%XMM0 |
(147) 0x82b0 MOV (%RDI,%R9,8),%RDX |
(147) 0x82b4 MOV 0x8(%RDI,%R9,8),%R10 |
(147) 0x82b9 MOV %R10,%RAX |
(147) 0x82bc SUB %RDX,%RAX |
(147) 0x82bf JLE 8290 |
(147) 0x82c1 MOV -0x48(%RBP),%RCX |
(147) 0x82c5 MOV (%RCX),%R11 |
(147) 0x82c8 MOV 0x20(%RBP),%RCX |
(147) 0x82cc MOV (%RCX),%RBX |
(147) 0x82cf MOV 0x10(%RBP),%RCX |
(147) 0x82d3 MOV (%RCX),%R12 |
(147) 0x82d6 MOV %RAX,%R13 |
(147) 0x82d9 AND $-0x4,%R13 |
(147) 0x82dd JE 8356 |
(147) 0x82df LEA -0x1(%R13),%RCX |
(147) 0x82e3 LEA (%R11,%RDX,8),%RSI |
(147) 0x82e7 LEA (%R12,%RDX,8),%R14 |
(147) 0x82eb VXORPD %XMM1,%XMM1,%XMM1 |
(147) 0x82ef XOR %R15D,%R15D |
(147) 0x82f2 NOPW %CS:(%RAX,%RAX,1) |
(149) 0x8300 VMOVUPD (%R14,%R15,8),%YMM2 |
(149) 0x8306 VXORPD %XMM3,%XMM3,%XMM3 |
(149) 0x830a KXNORW %K0,%K0,%K1 |
(149) 0x830e VGATHERQPD (%RBX,%YMM2,8),%YMM3{%K1} |
(149) 0x8315 VFNMADD231PD (%RSI,%R15,8),%YMM3,%YMM1 |
(149) 0x831b ADD $0x4,%R15 |
(149) 0x831f CMP %RCX,%R15 |
(149) 0x8322 JBE 8300 |
(147) 0x8324 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(147) 0x832a VADDPD %XMM2,%XMM1,%XMM1 |
(147) 0x832e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(147) 0x8333 VADDSD %XMM2,%XMM1,%XMM1 |
(147) 0x8337 VADDSD %XMM1,%XMM0,%XMM0 |
(147) 0x833b CMP %R13,%RAX |
(147) 0x833e MOV -0x40(%RBP),%R14 |
(147) 0x8342 MOV -0x30(%RBP),%R15 |
(147) 0x8346 MOV 0x28(%RBP),%RCX |
(147) 0x834a MOV -0x38(%RBP),%RSI |
(147) 0x834e JE 8290 |
(147) 0x8354 JMP 835d |
(147) 0x8356 XOR %R13D,%R13D |
(147) 0x8359 MOV 0x28(%RBP),%RCX |
(147) 0x835d ADD %RDX,%R13 |
(148) 0x8360 MOV (%R12,%R13,8),%RAX |
(148) 0x8364 VMOVSD (%RBX,%RAX,8),%XMM1 |
(148) 0x8369 VFNMADD231SD (%R11,%R13,8),%XMM1,%XMM0 |
(148) 0x836f INC %R13 |
(148) 0x8372 CMP %R13,%R10 |
(148) 0x8375 JNE 8360 |
(147) 0x8377 JMP 8290 |
0x837c CMP %R15,%R14 |
0x837f JGE 8b5c |
0x8385 MOV -0x30(%RBP),%RAX |
0x8389 MOV (%RAX),%RDX |
0x838c MOV (%RSI),%RSI |
0x838f MOV %R14,%RAX |
0x8392 NOT %RAX |
0x8395 ADD %RAX,%R15 |
0x8398 XOR %EDI,%EDI |
0x839a MOV %R15,-0x30(%RBP) |
0x839e MOV %RSI,-0x38(%RBP) |
0x83a2 JMP 83ca |
0x83a4 NOPW %CS:(%RAX,%RAX,1) |
(153) 0x83b0 VMULSD %XMM0,%XMM1,%XMM1 |
(153) 0x83b4 VMOVSD %XMM1,(%RSI,%R8,8) |
(153) 0x83ba LEA 0x1(%RDI),%RAX |
(153) 0x83be CMP %R15,%RDI |
(153) 0x83c1 MOV %RAX,%RDI |
(153) 0x83c4 JE 8b5c |
(153) 0x83ca LEA (%R14,%RDI,1),%R8 |
(153) 0x83ce MOV (%RDX,%R8,8),%R13 |
(153) 0x83d2 MOV 0x8(%RDX,%R8,8),%R9 |
(153) 0x83d7 VXORPD %XMM1,%XMM1,%XMM1 |
(153) 0x83db MOV %R9,%RAX |
(153) 0x83de SUB %R13,%RAX |
(153) 0x83e1 JLE 83b0 |
(153) 0x83e3 MOV -0x48(%RBP),%RCX |
(153) 0x83e7 MOV (%RCX),%R10 |
(153) 0x83ea MOV 0x20(%RBP),%RCX |
(153) 0x83ee MOV (%RCX),%R11 |
(153) 0x83f1 MOV 0x10(%RBP),%RCX |
(153) 0x83f5 MOV (%RCX),%RBX |
(153) 0x83f8 MOV %RAX,%R12 |
(153) 0x83fb AND $-0x4,%R12 |
(153) 0x83ff JE 846e |
(153) 0x8401 LEA -0x1(%R12),%RCX |
(153) 0x8406 LEA (%R10,%R13,8),%R14 |
(153) 0x840a LEA (%RBX,%R13,8),%R15 |
(153) 0x840e VXORPD %XMM1,%XMM1,%XMM1 |
(153) 0x8412 XOR %ESI,%ESI |
(153) 0x8414 NOPW %CS:(%RAX,%RAX,1) |
(155) 0x8420 VMOVUPD (%R15,%RSI,8),%YMM2 |
(155) 0x8426 VXORPD %XMM3,%XMM3,%XMM3 |
(155) 0x842a KXNORW %K0,%K0,%K1 |
(155) 0x842e VGATHERQPD (%R11,%YMM2,8),%YMM3{%K1} |
(155) 0x8435 VFMADD231PD (%R14,%RSI,8),%YMM3,%YMM1 |
(155) 0x843b ADD $0x4,%RSI |
(155) 0x843f CMP %RCX,%RSI |
(155) 0x8442 JBE 8420 |
(153) 0x8444 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(153) 0x844a VADDPD %XMM2,%XMM1,%XMM1 |
(153) 0x844e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(153) 0x8453 VADDSD %XMM2,%XMM1,%XMM1 |
(153) 0x8457 CMP %R12,%RAX |
(153) 0x845a MOV -0x40(%RBP),%R14 |
(153) 0x845e MOV -0x30(%RBP),%R15 |
(153) 0x8462 MOV -0x38(%RBP),%RSI |
(153) 0x8466 JE 83b0 |
(153) 0x846c JMP 8471 |
(153) 0x846e XOR %R12D,%R12D |
(153) 0x8471 ADD %R13,%R12 |
(153) 0x8474 NOPW %CS:(%RAX,%RAX,1) |
(154) 0x8480 MOV (%RBX,%R12,8),%RAX |
(154) 0x8484 VMOVSD (%R11,%RAX,8),%XMM2 |
(154) 0x848a VFMADD231SD (%R10,%R12,8),%XMM2,%XMM1 |
(154) 0x8490 INC %R12 |
(154) 0x8493 CMP %R12,%R9 |
(154) 0x8496 JNE 8480 |
(153) 0x8498 JMP 83b0 |
0x849d VUCOMISD 0x3b6b(%RIP),%XMM0 |
0x84a5 JNE 881c |
0x84ab CMP %R15,%R14 |
0x84ae JGE 8b5c |
0x84b4 MOV -0x30(%RBP),%RAX |
0x84b8 MOV (%RAX),%RDI |
0x84bb MOV (%RSI),%RSI |
0x84be MOV %R14,%RAX |
0x84c1 NOT %RAX |
0x84c4 ADD %RAX,%R15 |
0x84c7 XOR %R8D,%R8D |
0x84ca MOV %R15,-0x30(%RBP) |
0x84ce MOV %RSI,-0x38(%RBP) |
0x84d2 JMP 84f6 |
0x84d4 NOPW %CS:(%RAX,%RAX,1) |
(132) 0x84e0 VMOVSD %XMM0,(%RSI,%R9,8) |
(132) 0x84e6 LEA 0x1(%R8),%RAX |
(132) 0x84ea CMP %R15,%R8 |
(132) 0x84ed MOV %RAX,%R8 |
(132) 0x84f0 JE 8b5c |
(132) 0x84f6 LEA (%R14,%R8,1),%R9 |
(132) 0x84fa VMULSD (%RCX,%R9,8),%XMM5,%XMM0 |
(132) 0x8500 MOV (%RDI,%R9,8),%RDX |
(132) 0x8504 MOV 0x8(%RDI,%R9,8),%R10 |
(132) 0x8509 MOV %R10,%RAX |
(132) 0x850c SUB %RDX,%RAX |
(132) 0x850f JLE 84e0 |
(132) 0x8511 MOV -0x48(%RBP),%RCX |
(132) 0x8515 MOV (%RCX),%R11 |
(132) 0x8518 MOV 0x20(%RBP),%RCX |
(132) 0x851c MOV (%RCX),%RBX |
(132) 0x851f MOV 0x10(%RBP),%RCX |
(132) 0x8523 MOV (%RCX),%R12 |
(132) 0x8526 MOV %RAX,%R13 |
(132) 0x8529 AND $-0x4,%R13 |
(132) 0x852d JE 85a6 |
(132) 0x852f LEA -0x1(%R13),%RCX |
(132) 0x8533 LEA (%R11,%RDX,8),%RSI |
(132) 0x8537 LEA (%R12,%RDX,8),%R14 |
(132) 0x853b VXORPD %XMM1,%XMM1,%XMM1 |
(132) 0x853f XOR %R15D,%R15D |
(132) 0x8542 NOPW %CS:(%RAX,%RAX,1) |
(134) 0x8550 VMOVUPD (%R14,%R15,8),%YMM2 |
(134) 0x8556 VXORPD %XMM3,%XMM3,%XMM3 |
(134) 0x855a KXNORW %K0,%K0,%K1 |
(134) 0x855e VGATHERQPD (%RBX,%YMM2,8),%YMM3{%K1} |
(134) 0x8565 VFMADD231PD (%RSI,%R15,8),%YMM3,%YMM1 |
(134) 0x856b ADD $0x4,%R15 |
(134) 0x856f CMP %RCX,%R15 |
(134) 0x8572 JBE 8550 |
(132) 0x8574 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(132) 0x857a VADDPD %XMM2,%XMM1,%XMM1 |
(132) 0x857e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(132) 0x8583 VADDSD %XMM2,%XMM1,%XMM1 |
(132) 0x8587 VADDSD %XMM1,%XMM0,%XMM0 |
(132) 0x858b CMP %R13,%RAX |
(132) 0x858e MOV -0x40(%RBP),%R14 |
(132) 0x8592 MOV -0x30(%RBP),%R15 |
(132) 0x8596 MOV 0x28(%RBP),%RCX |
(132) 0x859a MOV -0x38(%RBP),%RSI |
(132) 0x859e JE 84e0 |
(132) 0x85a4 JMP 85ad |
(132) 0x85a6 XOR %R13D,%R13D |
(132) 0x85a9 MOV 0x28(%RBP),%RCX |
(132) 0x85ad ADD %RDX,%R13 |
(133) 0x85b0 MOV (%R12,%R13,8),%RAX |
(133) 0x85b4 VMOVSD (%RBX,%RAX,8),%XMM1 |
(133) 0x85b9 VFMADD231SD (%R11,%R13,8),%XMM1,%XMM0 |
(133) 0x85bf INC %R13 |
(133) 0x85c2 CMP %R13,%R10 |
(133) 0x85c5 JNE 85b0 |
(132) 0x85c7 JMP 84e0 |
0x85cc VUCOMISD 0x3a44(%RIP),%XMM0 |
0x85d4 JNE 893c |
0x85da CMP %R15,%R14 |
0x85dd JGE 8b5c |
0x85e3 MOV -0x30(%RBP),%RAX |
0x85e7 MOV (%RAX),%RDI |
0x85ea MOV (%RSI),%RSI |
0x85ed MOV %R14,%RAX |
0x85f0 NOT %RAX |
0x85f3 ADD %RAX,%R15 |
0x85f6 XOR %R8D,%R8D |
0x85f9 VMOVDDUP 0x3a1f(%RIP),%XMM0 |
0x8601 MOV %R15,-0x30(%RBP) |
0x8605 MOV %RSI,-0x38(%RBP) |
0x8609 JMP 8626 |
0x860b NOPL (%RAX,%RAX,1) |
(138) 0x8610 VMOVSD %XMM1,(%RSI,%R9,8) |
(138) 0x8616 LEA 0x1(%R8),%RAX |
(138) 0x861a CMP %R15,%R8 |
(138) 0x861d MOV %RAX,%R8 |
(138) 0x8620 JE 8b5c |
(138) 0x8626 LEA (%R14,%R8,1),%R9 |
(138) 0x862a VMOVSD (%RCX,%R9,8),%XMM1 |
(138) 0x8630 VXORPD %XMM0,%XMM1,%XMM1 |
(138) 0x8634 MOV (%RDI,%R9,8),%RDX |
(138) 0x8638 MOV 0x8(%RDI,%R9,8),%R10 |
(138) 0x863d MOV %R10,%RAX |
(138) 0x8640 SUB %RDX,%RAX |
(138) 0x8643 JLE 8610 |
(138) 0x8645 MOV -0x48(%RBP),%RCX |
(138) 0x8649 MOV (%RCX),%R11 |
(138) 0x864c MOV 0x20(%RBP),%RCX |
(138) 0x8650 MOV (%RCX),%RBX |
(138) 0x8653 MOV 0x10(%RBP),%RCX |
(138) 0x8657 MOV (%RCX),%R12 |
(138) 0x865a MOV %RAX,%R13 |
(138) 0x865d AND $-0x4,%R13 |
(138) 0x8661 JE 86d6 |
(138) 0x8663 LEA -0x1(%R13),%RCX |
(138) 0x8667 LEA (%R11,%RDX,8),%RSI |
(138) 0x866b LEA (%R12,%RDX,8),%R14 |
(138) 0x866f VXORPD %XMM2,%XMM2,%XMM2 |
(138) 0x8673 XOR %R15D,%R15D |
(138) 0x8676 NOPW %CS:(%RAX,%RAX,1) |
(140) 0x8680 VMOVUPD (%R14,%R15,8),%YMM3 |
(140) 0x8686 VXORPD %XMM4,%XMM4,%XMM4 |
(140) 0x868a KXNORW %K0,%K0,%K1 |
(140) 0x868e VGATHERQPD (%RBX,%YMM3,8),%YMM4{%K1} |
(140) 0x8695 VFNMADD231PD (%RSI,%R15,8),%YMM4,%YMM2 |
(140) 0x869b ADD $0x4,%R15 |
(140) 0x869f CMP %RCX,%R15 |
(140) 0x86a2 JBE 8680 |
(138) 0x86a4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(138) 0x86aa VADDPD %XMM3,%XMM2,%XMM2 |
(138) 0x86ae VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(138) 0x86b3 VADDSD %XMM3,%XMM2,%XMM2 |
(138) 0x86b7 VADDSD %XMM2,%XMM1,%XMM1 |
(138) 0x86bb CMP %R13,%RAX |
(138) 0x86be MOV -0x40(%RBP),%R14 |
(138) 0x86c2 MOV -0x30(%RBP),%R15 |
(138) 0x86c6 MOV 0x28(%RBP),%RCX |
(138) 0x86ca MOV -0x38(%RBP),%RSI |
(138) 0x86ce JE 8610 |
(138) 0x86d4 JMP 86dd |
(138) 0x86d6 XOR %R13D,%R13D |
(138) 0x86d9 MOV 0x28(%RBP),%RCX |
(138) 0x86dd ADD %RDX,%R13 |
(139) 0x86e0 MOV (%R12,%R13,8),%RAX |
(139) 0x86e4 VMOVSD (%RBX,%RAX,8),%XMM2 |
(139) 0x86e9 VFNMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(139) 0x86ef INC %R13 |
(139) 0x86f2 CMP %R13,%R10 |
(139) 0x86f5 JNE 86e0 |
(138) 0x86f7 JMP 8610 |
0x86fc CMP %R15,%R14 |
0x86ff JGE 8b5c |
0x8705 MOV -0x30(%RBP),%RAX |
0x8709 MOV (%RAX),%RDI |
0x870c MOV (%RSI),%RSI |
0x870f MOV %R14,%RAX |
0x8712 NOT %RAX |
0x8715 ADD %RAX,%R15 |
0x8718 XOR %R8D,%R8D |
0x871b VMOVDDUP 0x38fd(%RIP),%XMM1 |
0x8723 MOV %R15,-0x30(%RBP) |
0x8727 MOV %RSI,-0x38(%RBP) |
0x872b JMP 874a |
0x872d NOPL (%RAX) |
(144) 0x8730 VMULSD %XMM0,%XMM2,%XMM2 |
(144) 0x8734 VMOVSD %XMM2,(%RSI,%R9,8) |
(144) 0x873a LEA 0x1(%R8),%RAX |
(144) 0x873e CMP %R15,%R8 |
(144) 0x8741 MOV %RAX,%R8 |
(144) 0x8744 JE 8b5c |
(144) 0x874a LEA (%R14,%R8,1),%R9 |
(144) 0x874e VMOVSD (%RCX,%R9,8),%XMM2 |
(144) 0x8754 VXORPD %XMM1,%XMM2,%XMM2 |
(144) 0x8758 MOV (%RDI,%R9,8),%RDX |
(144) 0x875c MOV 0x8(%RDI,%R9,8),%R10 |
(144) 0x8761 MOV %R10,%RAX |
(144) 0x8764 SUB %RDX,%RAX |
(144) 0x8767 JLE 8730 |
(144) 0x8769 MOV -0x48(%RBP),%RCX |
(144) 0x876d MOV (%RCX),%R11 |
(144) 0x8770 MOV 0x20(%RBP),%RCX |
(144) 0x8774 MOV (%RCX),%RBX |
(144) 0x8777 MOV 0x10(%RBP),%RCX |
(144) 0x877b MOV (%RCX),%R12 |
(144) 0x877e MOV %RAX,%R13 |
(144) 0x8781 AND $-0x4,%R13 |
(144) 0x8785 JE 87f6 |
(144) 0x8787 LEA -0x1(%R13),%RCX |
(144) 0x878b LEA (%R11,%RDX,8),%RSI |
(144) 0x878f LEA (%R12,%RDX,8),%R14 |
(144) 0x8793 VXORPD %XMM3,%XMM3,%XMM3 |
(144) 0x8797 XOR %R15D,%R15D |
(144) 0x879a NOPW (%RAX,%RAX,1) |
(146) 0x87a0 VMOVUPD (%R14,%R15,8),%YMM4 |
(146) 0x87a6 KXNORW %K0,%K0,%K1 |
(146) 0x87aa VXORPD %XMM5,%XMM5,%XMM5 |
(146) 0x87ae VGATHERQPD (%RBX,%YMM4,8),%YMM5{%K1} |
(146) 0x87b5 VFMADD231PD (%RSI,%R15,8),%YMM5,%YMM3 |
(146) 0x87bb ADD $0x4,%R15 |
(146) 0x87bf CMP %RCX,%R15 |
(146) 0x87c2 JBE 87a0 |
(144) 0x87c4 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(144) 0x87ca VADDPD %XMM4,%XMM3,%XMM3 |
(144) 0x87ce VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(144) 0x87d3 VADDSD %XMM4,%XMM3,%XMM3 |
(144) 0x87d7 VADDSD %XMM3,%XMM2,%XMM2 |
(144) 0x87db CMP %R13,%RAX |
(144) 0x87de MOV -0x40(%RBP),%R14 |
(144) 0x87e2 MOV -0x30(%RBP),%R15 |
(144) 0x87e6 MOV 0x28(%RBP),%RCX |
(144) 0x87ea MOV -0x38(%RBP),%RSI |
(144) 0x87ee JE 8730 |
(144) 0x87f4 JMP 87fd |
(144) 0x87f6 XOR %R13D,%R13D |
(144) 0x87f9 MOV 0x28(%RBP),%RCX |
(144) 0x87fd ADD %RDX,%R13 |
(145) 0x8800 MOV (%R12,%R13,8),%RAX |
(145) 0x8804 VMOVSD (%RBX,%RAX,8),%XMM3 |
(145) 0x8809 VFMADD231SD (%R11,%R13,8),%XMM3,%XMM2 |
(145) 0x880f INC %R13 |
(145) 0x8812 CMP %R13,%R10 |
(145) 0x8815 JNE 8800 |
(144) 0x8817 JMP 8730 |
0x881c VUCOMISD 0x37f4(%RIP),%XMM0 |
0x8824 JNE 8a4c |
0x882a CMP %R15,%R14 |
0x882d JGE 8b5c |
0x8833 VXORPD 0x37e3(%RIP){1to2},%XMM5,%XMM0 |
0x883d MOV -0x30(%RBP),%RAX |
0x8841 MOV (%RAX),%RDI |
0x8844 MOV (%RSI),%RDX |
0x8847 MOV %R14,%RAX |
0x884a NOT %RAX |
0x884d ADD %RAX,%R15 |
0x8850 XOR %R8D,%R8D |
0x8853 MOV %R15,-0x30(%RBP) |
0x8857 MOV %RDX,-0x38(%RBP) |
0x885b JMP 8873 |
(129) 0x885d VMOVSD %XMM1,(%RDX,%R9,8) |
(129) 0x8863 LEA 0x1(%R8),%RAX |
(129) 0x8867 CMP %R15,%R8 |
(129) 0x886a MOV %RAX,%R8 |
(129) 0x886d JE 8b5c |
(129) 0x8873 LEA (%R14,%R8,1),%R9 |
(129) 0x8877 VMULSD (%RCX,%R9,8),%XMM0,%XMM1 |
(129) 0x887d MOV (%RDI,%R9,8),%RSI |
(129) 0x8881 MOV 0x8(%RDI,%R9,8),%R10 |
(129) 0x8886 MOV %R10,%RAX |
(129) 0x8889 SUB %RSI,%RAX |
(129) 0x888c JLE 885d |
(129) 0x888e MOV -0x48(%RBP),%RCX |
(129) 0x8892 MOV (%RCX),%R11 |
(129) 0x8895 MOV 0x20(%RBP),%RCX |
(129) 0x8899 MOV (%RCX),%RBX |
(129) 0x889c MOV 0x10(%RBP),%RCX |
(129) 0x88a0 MOV (%RCX),%R12 |
(129) 0x88a3 MOV %RAX,%R13 |
(129) 0x88a6 AND $-0x4,%R13 |
(129) 0x88aa JE 8916 |
(129) 0x88ac LEA -0x1(%R13),%RDX |
(129) 0x88b0 LEA (%R11,%RSI,8),%RCX |
(129) 0x88b4 LEA (%R12,%RSI,8),%R14 |
(129) 0x88b8 VXORPD %XMM2,%XMM2,%XMM2 |
(129) 0x88bc XOR %R15D,%R15D |
(129) 0x88bf NOP |
(131) 0x88c0 VMOVUPD (%R14,%R15,8),%YMM3 |
(131) 0x88c6 VXORPD %XMM4,%XMM4,%XMM4 |
(131) 0x88ca KXNORW %K0,%K0,%K1 |
(131) 0x88ce VGATHERQPD (%RBX,%YMM3,8),%YMM4{%K1} |
(131) 0x88d5 VFNMADD231PD (%RCX,%R15,8),%YMM4,%YMM2 |
(131) 0x88db ADD $0x4,%R15 |
(131) 0x88df CMP %RDX,%R15 |
(131) 0x88e2 JBE 88c0 |
(129) 0x88e4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(129) 0x88ea VADDPD %XMM3,%XMM2,%XMM2 |
(129) 0x88ee VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(129) 0x88f3 VADDSD %XMM3,%XMM2,%XMM2 |
(129) 0x88f7 VADDSD %XMM2,%XMM1,%XMM1 |
(129) 0x88fb CMP %R13,%RAX |
(129) 0x88fe MOV -0x40(%RBP),%R14 |
(129) 0x8902 MOV -0x30(%RBP),%R15 |
(129) 0x8906 MOV 0x28(%RBP),%RCX |
(129) 0x890a MOV -0x38(%RBP),%RDX |
(129) 0x890e JE 885d |
(129) 0x8914 JMP 891d |
(129) 0x8916 XOR %R13D,%R13D |
(129) 0x8919 MOV 0x28(%RBP),%RCX |
(129) 0x891d ADD %RSI,%R13 |
(130) 0x8920 MOV (%R12,%R13,8),%RAX |
(130) 0x8924 VMOVSD (%RBX,%RAX,8),%XMM2 |
(130) 0x8929 VFNMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(130) 0x892f INC %R13 |
(130) 0x8932 CMP %R13,%R10 |
(130) 0x8935 JNE 8920 |
(129) 0x8937 JMP 885d |
0x893c CMP %R15,%R14 |
0x893f JGE 8b5c |
0x8945 MOV -0x30(%RBP),%RAX |
0x8949 MOV (%RAX),%RDI |
0x894c MOV (%RSI),%RSI |
0x894f MOV %R14,%RAX |
0x8952 NOT %RAX |
0x8955 ADD %RAX,%R15 |
0x8958 XOR %R8D,%R8D |
0x895b MOV %R15,-0x30(%RBP) |
0x895f MOV %RSI,-0x38(%RBP) |
0x8963 JMP 897f |
(135) 0x8965 VMULSD %XMM0,%XMM1,%XMM1 |
(135) 0x8969 VMOVSD %XMM1,(%RSI,%R9,8) |
(135) 0x896f LEA 0x1(%R8),%RAX |
(135) 0x8973 CMP %R15,%R8 |
(135) 0x8976 MOV %RAX,%R8 |
(135) 0x8979 JE 8b5c |
(135) 0x897f LEA (%R14,%R8,1),%R9 |
(135) 0x8983 VMOVSD (%RCX,%R9,8),%XMM1 |
(135) 0x8989 MOV (%RDI,%R9,8),%RDX |
(135) 0x898d MOV 0x8(%RDI,%R9,8),%R10 |
(135) 0x8992 MOV %R10,%RAX |
(135) 0x8995 SUB %RDX,%RAX |
(135) 0x8998 JLE 8965 |
(135) 0x899a MOV -0x48(%RBP),%RCX |
(135) 0x899e MOV (%RCX),%R11 |
(135) 0x89a1 MOV 0x20(%RBP),%RCX |
(135) 0x89a5 MOV (%RCX),%RBX |
(135) 0x89a8 MOV 0x10(%RBP),%RCX |
(135) 0x89ac MOV (%RCX),%R12 |
(135) 0x89af MOV %RAX,%R13 |
(135) 0x89b2 AND $-0x4,%R13 |
(135) 0x89b6 JE 8a26 |
(135) 0x89b8 LEA -0x1(%R13),%RCX |
(135) 0x89bc LEA (%R11,%RDX,8),%RSI |
(135) 0x89c0 LEA (%R12,%RDX,8),%R14 |
(135) 0x89c4 VXORPD %XMM2,%XMM2,%XMM2 |
(135) 0x89c8 XOR %R15D,%R15D |
(135) 0x89cb NOPL (%RAX,%RAX,1) |
(137) 0x89d0 VMOVUPD (%R14,%R15,8),%YMM3 |
(137) 0x89d6 VXORPD %XMM4,%XMM4,%XMM4 |
(137) 0x89da KXNORW %K0,%K0,%K1 |
(137) 0x89de VGATHERQPD (%RBX,%YMM3,8),%YMM4{%K1} |
(137) 0x89e5 VFMADD231PD (%RSI,%R15,8),%YMM4,%YMM2 |
(137) 0x89eb ADD $0x4,%R15 |
(137) 0x89ef CMP %RCX,%R15 |
(137) 0x89f2 JBE 89d0 |
(135) 0x89f4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(135) 0x89fa VADDPD %XMM3,%XMM2,%XMM2 |
(135) 0x89fe VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(135) 0x8a03 VADDSD %XMM3,%XMM2,%XMM2 |
(135) 0x8a07 VADDSD %XMM2,%XMM1,%XMM1 |
(135) 0x8a0b CMP %R13,%RAX |
(135) 0x8a0e MOV -0x40(%RBP),%R14 |
(135) 0x8a12 MOV -0x30(%RBP),%R15 |
(135) 0x8a16 MOV 0x28(%RBP),%RCX |
(135) 0x8a1a MOV -0x38(%RBP),%RSI |
(135) 0x8a1e JE 8965 |
(135) 0x8a24 JMP 8a2d |
(135) 0x8a26 XOR %R13D,%R13D |
(135) 0x8a29 MOV 0x28(%RBP),%RCX |
(135) 0x8a2d ADD %RDX,%R13 |
(136) 0x8a30 MOV (%R12,%R13,8),%RAX |
(136) 0x8a34 VMOVSD (%RBX,%RAX,8),%XMM2 |
(136) 0x8a39 VFMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(136) 0x8a3f INC %R13 |
(136) 0x8a42 CMP %R13,%R10 |
(136) 0x8a45 JNE 8a30 |
(135) 0x8a47 JMP 8965 |
0x8a4c CMP %R15,%R14 |
0x8a4f JGE 8b5c |
0x8a55 MOV -0x30(%RBP),%RAX |
0x8a59 MOV (%RAX),%RDI |
0x8a5c MOV (%RSI),%RDX |
0x8a5f MOV %R14,%RAX |
0x8a62 NOT %RAX |
0x8a65 ADD %RAX,%R15 |
0x8a68 XOR %R8D,%R8D |
0x8a6b MOV %R15,-0x30(%RBP) |
0x8a6f MOV %RDX,-0x38(%RBP) |
0x8a73 JMP 8a8f |
(126) 0x8a75 VMULSD %XMM0,%XMM1,%XMM1 |
(126) 0x8a79 VMOVSD %XMM1,(%RDX,%R9,8) |
(126) 0x8a7f LEA 0x1(%R8),%RAX |
(126) 0x8a83 CMP %R15,%R8 |
(126) 0x8a86 MOV %RAX,%R8 |
(126) 0x8a89 JE 8b5c |
(126) 0x8a8f LEA (%R14,%R8,1),%R9 |
(126) 0x8a93 VMULSD (%RCX,%R9,8),%XMM5,%XMM1 |
(126) 0x8a99 MOV (%RDI,%R9,8),%RSI |
(126) 0x8a9d MOV 0x8(%RDI,%R9,8),%R10 |
(126) 0x8aa2 MOV %R10,%RAX |
(126) 0x8aa5 SUB %RSI,%RAX |
(126) 0x8aa8 JLE 8a75 |
(126) 0x8aaa MOV -0x48(%RBP),%RCX |
(126) 0x8aae MOV (%RCX),%R11 |
(126) 0x8ab1 MOV 0x20(%RBP),%RCX |
(126) 0x8ab5 MOV (%RCX),%RBX |
(126) 0x8ab8 MOV 0x10(%RBP),%RCX |
(126) 0x8abc MOV (%RCX),%R12 |
(126) 0x8abf MOV %RAX,%R13 |
(126) 0x8ac2 AND $-0x4,%R13 |
(126) 0x8ac6 JE 8b36 |
(126) 0x8ac8 LEA -0x1(%R13),%RDX |
(126) 0x8acc LEA (%R11,%RSI,8),%RCX |
(126) 0x8ad0 LEA (%R12,%RSI,8),%R14 |
(126) 0x8ad4 VXORPD %XMM2,%XMM2,%XMM2 |
(126) 0x8ad8 XOR %R15D,%R15D |
(126) 0x8adb NOPL (%RAX,%RAX,1) |
(128) 0x8ae0 VMOVUPD (%R14,%R15,8),%YMM3 |
(128) 0x8ae6 KXNORW %K0,%K0,%K1 |
(128) 0x8aea VXORPD %XMM4,%XMM4,%XMM4 |
(128) 0x8aee VGATHERQPD (%RBX,%YMM3,8),%YMM4{%K1} |
(128) 0x8af5 VFMADD231PD (%RCX,%R15,8),%YMM4,%YMM2 |
(128) 0x8afb ADD $0x4,%R15 |
(128) 0x8aff CMP %RDX,%R15 |
(128) 0x8b02 JBE 8ae0 |
(126) 0x8b04 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(126) 0x8b0a VADDPD %XMM3,%XMM2,%XMM2 |
(126) 0x8b0e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(126) 0x8b13 VADDSD %XMM3,%XMM2,%XMM2 |
(126) 0x8b17 VADDSD %XMM2,%XMM1,%XMM1 |
(126) 0x8b1b CMP %R13,%RAX |
(126) 0x8b1e MOV -0x40(%RBP),%R14 |
(126) 0x8b22 MOV -0x30(%RBP),%R15 |
(126) 0x8b26 MOV 0x28(%RBP),%RCX |
(126) 0x8b2a MOV -0x38(%RBP),%RDX |
(126) 0x8b2e JE 8a75 |
(126) 0x8b34 JMP 8b3d |
(126) 0x8b36 XOR %R13D,%R13D |
(126) 0x8b39 MOV 0x28(%RBP),%RCX |
(126) 0x8b3d ADD %RSI,%R13 |
(127) 0x8b40 MOV (%R12,%R13,8),%RAX |
(127) 0x8b44 VMOVSD (%RBX,%RAX,8),%XMM2 |
(127) 0x8b49 VFMADD231SD (%R11,%R13,8),%XMM2,%XMM1 |
(127) 0x8b4f INC %R13 |
(127) 0x8b52 CMP %R13,%R10 |
(127) 0x8b55 JNE 8b40 |
(126) 0x8b57 JMP 8a75 |
0x8b5c ADD $0x28,%RSP |
0x8b60 POP %RBX |
0x8b61 POP %R12 |
0x8b63 POP %R13 |
0x8b65 POP %R14 |
0x8b67 POP %R15 |
0x8b69 POP %RBP |
0x8b6a VZEROUPPER |
0x8b6d RET |
0x8b6e XCHG %AX,%AX |
Path / |
Source file and lines | csr_matvec.c:243-404 |
Module | libseq_mv.so |
nb instructions | 320 |
nb uops | 357 |
loop length | 1268 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 8 |
micro-operation queue | 59.50 cycles |
front end | 59.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 27.00 | 25.00 | 25.33 | 25.33 | 23.50 | 25.00 | 27.00 | 23.50 | 23.50 | 23.50 | 25.00 | 25.33 |
cycles | 27.00 | 27.40 | 25.33 | 25.33 | 23.50 | 25.00 | 27.00 | 23.50 | 23.50 | 23.50 | 25.00 | 25.33 |
Cycles executing div or sqrt instructions | 32.00 |
FE+BE cycles | 56.66 |
Stall cycles | 0.00 |
Front-end | 59.50 |
Dispatch | 27.40 |
DIV/SQRT | 32.00 |
Overall L1 | 59.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 1% |
all | 11% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 4% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R14,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 7c22 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x82> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 7c2b <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 7c33 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x93> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%RCX,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RBX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3140 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
SUB %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7c33 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x93> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JG 7bf9 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x59> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVQ $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R14,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 7c66 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 7c6a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xca> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x40(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 7e9d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x2fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 7c9c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R12,%R15,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RBX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3140 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 7cd8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x138> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x9338(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x46bb(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x465c(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x45cb(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 7ce6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x146> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 7d1d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x17d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x92f3(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x4676(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x4626(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x4586(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 7d2c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x18c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 7d68 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x92ad(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x4630(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x4602(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x4540(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE 7eae <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x30e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x4289(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 7fec <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x44c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7dd6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x236> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JG 7ca1 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x101> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 7cd8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x138> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x28(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x415e(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 810d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x56d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x4148(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 824c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x6ac> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x412b(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7f16 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x376> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x4024(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 837c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7dc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 8046 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4a6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3efb(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 849d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x3eed(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 85cc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa2c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 8176 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x5d6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3dc4(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 86fc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb5c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 82a6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x706> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 83ca <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x82a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3b6b(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 881c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 84f6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x956> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3a44(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 893c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd9c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x3a1f(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 8626 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa86> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x38fd(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 874a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbaa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x37f4(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 8a4c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xeac> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x37e3(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 8873 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcd3> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 897f <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xddf> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 8a8f <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xeef> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matvec.c:243-404 |
Module | libseq_mv.so |
nb instructions | 320 |
nb uops | 357 |
loop length | 1268 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 8 |
micro-operation queue | 59.50 cycles |
front end | 59.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 27.00 | 25.00 | 25.33 | 25.33 | 23.50 | 25.00 | 27.00 | 23.50 | 23.50 | 23.50 | 25.00 | 25.33 |
cycles | 27.00 | 27.40 | 25.33 | 25.33 | 23.50 | 25.00 | 27.00 | 23.50 | 23.50 | 23.50 | 25.00 | 25.33 |
Cycles executing div or sqrt instructions | 32.00 |
FE+BE cycles | 56.66 |
Stall cycles | 0.00 |
Front-end | 59.50 |
Dispatch | 27.40 |
DIV/SQRT | 32.00 |
Overall L1 | 59.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 1% |
all | 11% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 4% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R15),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R14,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 7c22 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x82> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 7c2b <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 7c33 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x93> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%RCX,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RBX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3140 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
SUB %R12,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7c33 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x93> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JG 7bf9 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x59> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOVQ $0,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CALL 3080 <hypre_GetThreadNum@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x20(%R15),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R15),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%R15),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 3170 <hypre_NumActiveThreads@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x1(%R14,%RAX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 7c66 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %RCX | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 7c6a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xca> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %ECX | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x40(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 7e9d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x2fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
INC %RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RBX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 7c9c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R12,%R15,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RBX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 3140 <hypre_LowerBound@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAR $0x3,%R15 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 7cd8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x138> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x9338(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x46bb(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x465c(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x45cb(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 7ce6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x146> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 7d1d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x17d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x92f3(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x4676(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x4626(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x4586(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 7d2c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x18c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 7d68 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1c8> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x92ad(%RIP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x4630(%RIP),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x4602(%RIP),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 31e0 <hypre_fprintf@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA 0x4540(%RIP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 3220 <hypre_error_handler@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JNE 7eae <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x30e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x4289(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 7fec <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x44c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7dd6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x236> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R15D,%R15D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JG 7ca1 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x101> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 7cd8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x138> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV 0x28(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x415e(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 810d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x56d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x4148(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 824c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x6ac> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x412b(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 7f16 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x376> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x4024(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 837c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7dc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 8046 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4a6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3efb(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 849d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x3eed(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 85cc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa2c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 8176 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x5d6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3dc4(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 86fc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb5c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 82a6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x706> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 83ca <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x82a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3b6b(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 881c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 84f6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x956> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x3a44(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 893c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd9c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x3a1f(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 8626 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa86> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x38fd(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 874a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbaa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x37f4(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 8a4c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xeac> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x37e3(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 8873 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcd3> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 897f <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xddf> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 8b5c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 8a8f <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xeef> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace.extracted– | 17.95 | 3.7 |
▼Loop 141 - csr_matvec.c:334-341 - libseq_mv.so– | 0.64 | 0.12 |
○Loop 142 - csr_matvec.c:337-339 - libseq_mv.so | 0.5 | 0.09 |
○Loop 143 - csr_matvec.c:337-339 - libseq_mv.so | 0.13 | 0.02 |
▼Loop 147 - csr_matvec.c:307-314 - libseq_mv.so– | 0.53 | 0.1 |
○Loop 149 - csr_matvec.c:310-312 - libseq_mv.so | 7.11 | 1.33 |
○Loop 148 - csr_matvec.c:310-312 - libseq_mv.so | 1.03 | 0.19 |
▼Loop 159 - csr_matvec.c:256-263 - libseq_mv.so– | 0.35 | 0.06 |
○Loop 161 - csr_matvec.c:259-261 - libseq_mv.so | 6.72 | 1.26 |
○Loop 160 - csr_matvec.c:259-261 - libseq_mv.so | 0.95 | 0.18 |
▼Loop 153 - csr_matvec.c:280-287 - libseq_mv.so– | 0 | 0 |
○Loop 154 - csr_matvec.c:283-285 - libseq_mv.so | 0 | 0 |
○Loop 155 - csr_matvec.c:283-285 - libseq_mv.so | 0 | 0 |
▼Loop 129 - csr_matvec.c:385-392 - libseq_mv.so– | 0 | 0 |
○Loop 130 - csr_matvec.c:388-390 - libseq_mv.so | 0 | 0 |
○Loop 131 - csr_matvec.c:388-390 - libseq_mv.so | 0 | 0 |
▼Loop 144 - csr_matvec.c:319-326 - libseq_mv.so– | 0 | 0 |
○Loop 146 - csr_matvec.c:322-324 - libseq_mv.so | 0 | 0.01 |
○Loop 145 - csr_matvec.c:322-324 - libseq_mv.so | 0 | 0 |
▼Loop 150 - csr_matvec.c:295-302 - libseq_mv.so– | 0 | 0 |
○Loop 152 - csr_matvec.c:298-300 - libseq_mv.so | 0 | 0 |
○Loop 151 - csr_matvec.c:298-300 - libseq_mv.so | 0 | 0 |
▼Loop 138 - csr_matvec.c:346-353 - libseq_mv.so– | 0 | 0 |
○Loop 140 - csr_matvec.c:349-351 - libseq_mv.so | 0 | 0 |
○Loop 139 - csr_matvec.c:349-351 - libseq_mv.so | 0 | 0 |
▼Loop 156 - csr_matvec.c:268-275 - libseq_mv.so– | 0 | 0 |
○Loop 158 - csr_matvec.c:271-273 - libseq_mv.so | 0 | 0 |
○Loop 157 - csr_matvec.c:271-273 - libseq_mv.so | 0 | 0 |
▼Loop 132 - csr_matvec.c:373-380 - libseq_mv.so– | 0 | 0 |
○Loop 133 - csr_matvec.c:376-378 - libseq_mv.so | 0 | 0 |
○Loop 134 - csr_matvec.c:376-378 - libseq_mv.so | 0 | 0 |
▼Loop 126 - csr_matvec.c:397-404 - libseq_mv.so– | 0 | 0 |
○Loop 128 - csr_matvec.c:400-402 - libseq_mv.so | 0 | 0 |
○Loop 127 - csr_matvec.c:400-402 - libseq_mv.so | 0 | 0 |
▼Loop 135 - csr_matvec.c:358-365 - libseq_mv.so– | 0 | 0 |
○Loop 137 - csr_matvec.c:361-363 - libseq_mv.so | 0 | 0 |
○Loop 136 - csr_matvec.c:361-363 - libseq_mv.so | 0 | 0 |