Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 14.69% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 14.69% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-112-7443/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 243 - 404 |
-------------------------------------------------------------------------------- |
243: #pragma omp parallel private(i,jj,tempx) |
244: #endif |
245: { |
246: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
247: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
248: hypre_assert(iBegin <= iEnd); |
249: hypre_assert(iBegin >= 0 && iBegin <= num_rows); |
250: hypre_assert(iEnd >= 0 && iEnd <= num_rows); |
251: |
252: if (0 == temp) |
253: { |
254: if (1 == alpha) // JSP: a common path |
255: { |
256: for (i = iBegin; i < iEnd; i++) |
257: { |
258: tempx = 0.0; |
259: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
260: { |
261: tempx += A_data[jj] * x_data[A_j[jj]]; |
262: } |
263: y_data[i] = tempx; |
264: } |
265: } // y = A*x |
266: else if (-1 == alpha) |
267: { |
268: for (i = iBegin; i < iEnd; i++) |
269: { |
270: tempx = 0.0; |
271: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
272: { |
273: tempx -= A_data[jj] * x_data[A_j[jj]]; |
274: } |
275: y_data[i] = tempx; |
276: } |
277: } // y = -A*x |
278: else |
279: { |
280: for (i = iBegin; i < iEnd; i++) |
281: { |
282: tempx = 0.0; |
283: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
284: { |
285: tempx += A_data[jj] * x_data[A_j[jj]]; |
286: } |
287: y_data[i] = alpha*tempx; |
288: } |
289: } // y = alpha*A*x |
290: } // temp == 0 |
291: else if (-1 == temp) // beta == -alpha |
292: { |
293: if (1 == alpha) // JSP: a common path |
294: { |
295: for (i = iBegin; i < iEnd; i++) |
296: { |
297: tempx = -b_data[i]; |
298: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
299: { |
300: tempx += A_data[jj] * x_data[A_j[jj]]; |
301: } |
302: y_data[i] = tempx; |
303: } |
304: } // y = A*x - y |
305: else if (-1 == alpha) // JSP: a common path |
306: { |
307: for (i = iBegin; i < iEnd; i++) |
308: { |
309: tempx = b_data[i]; |
310: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
311: { |
312: tempx -= A_data[jj] * x_data[A_j[jj]]; |
313: } |
314: y_data[i] = tempx; |
315: } |
316: } // y = -A*x + y |
317: else |
318: { |
319: for (i = iBegin; i < iEnd; i++) |
320: { |
321: tempx = -b_data[i]; |
322: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
323: { |
324: tempx += A_data[jj] * x_data[A_j[jj]]; |
325: } |
326: y_data[i] = alpha*tempx; |
327: } |
328: } // y = alpha*(A*x - y) |
329: } // temp == -1 |
330: else if (1 == temp) |
331: { |
332: if (1 == alpha) // JSP: a common path |
333: { |
334: for (i = iBegin; i < iEnd; i++) |
335: { |
336: tempx = b_data[i]; |
337: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
338: { |
339: tempx += A_data[jj] * x_data[A_j[jj]]; |
340: } |
341: y_data[i] = tempx; |
342: } |
343: } // y = A*x + y |
344: else if (-1 == alpha) |
345: { |
346: for (i = iBegin; i < iEnd; i++) |
347: { |
348: tempx = -b_data[i]; |
349: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
350: { |
351: tempx -= A_data[jj] * x_data[A_j[jj]]; |
352: } |
353: y_data[i] = tempx; |
354: } |
355: } // y = -A*x - y |
356: else |
357: { |
358: for (i = iBegin; i < iEnd; i++) |
359: { |
360: tempx = b_data[i]; |
361: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
362: { |
363: tempx += A_data[jj] * x_data[A_j[jj]]; |
364: } |
365: y_data[i] = alpha*tempx; |
[...] |
371: if (1 == alpha) // JSP: a common path |
372: { |
373: for (i = iBegin; i < iEnd; i++) |
374: { |
375: tempx = b_data[i]*temp; |
376: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
377: { |
378: tempx += A_data[jj] * x_data[A_j[jj]]; |
379: } |
380: y_data[i] = tempx; |
381: } |
382: } // y = A*x + temp*y |
383: else if (-1 == alpha) |
384: { |
385: for (i = iBegin; i < iEnd; i++) |
386: { |
387: tempx = -b_data[i]*temp; |
388: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
389: { |
390: tempx -= A_data[jj] * x_data[A_j[jj]]; |
391: } |
392: y_data[i] = tempx; |
393: } |
394: } // y = -A*x - temp*y |
395: else |
396: { |
397: for (i = iBegin; i < iEnd; i++) |
398: { |
399: tempx = b_data[i]*temp; |
400: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
401: { |
402: tempx += A_data[jj] * x_data[A_j[jj]]; |
403: } |
404: y_data[i] = alpha*tempx; |
0x510a70 PUSH %RBP |
0x510a71 MOV %RSP,%RBP |
0x510a74 PUSH %R15 |
0x510a76 PUSH %R14 |
0x510a78 PUSH %R13 |
0x510a7a PUSH %R12 |
0x510a7c PUSH %RBX |
0x510a7d SUB $0x18,%RSP |
0x510a81 MOV %R9,%RBX |
0x510a84 MOV %R8,%R14 |
0x510a87 MOV %RCX,%R12 |
0x510a8a MOV %RDX,-0x38(%RBP) |
0x510a8e MOV %RCX,%RDI |
0x510a91 CALL 50efa0 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> |
0x510a96 MOV %R12,%RDI |
0x510a99 MOV %RAX,%R12 |
0x510a9c CALL 50f060 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> |
0x510aa1 MOV %RAX,%R15 |
0x510aa4 CMP %RAX,%R12 |
0x510aa7 JLE 510ad7 |
0x510aa9 MOV 0x52150(%RIP),%RDI |
0x510ab0 MOV $0x53be7d,%ESI |
0x510ab5 MOV $0x53de03,%EDX |
0x510aba XOR %EAX,%EAX |
0x510abc CALL 51b970 <hypre_fprintf> |
0x510ac1 MOV $0x53e799,%EDI |
0x510ac6 MOV $0xf8,%ESI |
0x510acb MOV $0x1,%EDX |
0x510ad0 XOR %ECX,%ECX |
0x510ad2 CALL 51e980 <hypre_error_handler> |
0x510ad7 MOV 0x18(%RBP),%R13 |
0x510adb TEST %R12,%R12 |
0x510ade JS 510ae5 |
0x510ae0 CMP %R13,%R12 |
0x510ae3 JLE 510b13 |
0x510ae5 MOV 0x52114(%RIP),%RDI |
0x510aec MOV $0x53be7d,%ESI |
0x510af1 MOV $0x53e81c,%EDX |
0x510af6 XOR %EAX,%EAX |
0x510af8 CALL 51b970 <hypre_fprintf> |
0x510afd MOV $0x53e799,%EDI |
0x510b02 MOV $0xf9,%ESI |
0x510b07 MOV $0x1,%EDX |
0x510b0c XOR %ECX,%ECX |
0x510b0e CALL 51e980 <hypre_error_handler> |
0x510b13 VMOVSD 0x38(%RBP),%XMM5 |
0x510b18 TEST %R15,%R15 |
0x510b1b JS 510b22 |
0x510b1d CMP %R13,%R15 |
0x510b20 JLE 510b55 |
0x510b22 MOV 0x520d7(%RIP),%RDI |
0x510b29 MOV $0x53be7d,%ESI |
0x510b2e MOV $0x53e83e,%EDX |
0x510b33 XOR %EAX,%EAX |
0x510b35 CALL 51b970 <hypre_fprintf> |
0x510b3a MOV $0x53e799,%EDI |
0x510b3f MOV $0xfa,%ESI |
0x510b44 MOV $0x1,%EDX |
0x510b49 XOR %ECX,%ECX |
0x510b4b CALL 51e980 <hypre_error_handler> |
0x510b50 VMOVSD 0x38(%RBP),%XMM5 |
0x510b55 MOV 0x30(%RBP),%R13 |
0x510b59 MOV 0x20(%RBP),%RCX |
0x510b5d MOV 0x10(%RBP),%RDX |
0x510b61 VMOVSD -0x38(%RBP),%XMM0 |
0x510b66 VXORPD %XMM1,%XMM1,%XMM1 |
0x510b6a VUCOMISD %XMM1,%XMM5 |
0x510b6e MOV %R12,-0x38(%RBP) |
0x510b72 MOV %RBX,-0x30(%RBP) |
0x510b76 JNE 510cc0 |
0x510b7c VUCOMISD 0x1948c(%RIP),%XMM0 |
0x510b84 JNE 510e00 |
0x510b8a CMP %R15,%R12 |
0x510b8d JGE 511a80 |
0x510b93 MOV %R12,%RAX |
0x510b96 NOT %RAX |
0x510b99 ADD %RAX,%R15 |
0x510b9c XOR %ESI,%ESI |
0x510b9e JMP 510bd4 |
0x510ba0 NOPW %CS:(%RAX,%RAX,1) |
0x510baf NOPW %CS:(%RAX,%RAX,1) |
0x510bbe XCHG %AX,%AX |
(4339) 0x510bc0 VMOVSD %XMM0,(%R13,%RDI,8) |
(4339) 0x510bc7 CMP %R15,%RSI |
(4339) 0x510bca LEA 0x1(%RSI),%RSI |
(4339) 0x510bce JE 511a80 |
(4339) 0x510bd4 LEA (%R12,%RSI,1),%RDI |
(4339) 0x510bd8 MOV (%RBX,%RDI,8),%R10 |
(4339) 0x510bdc MOV 0x8(%RBX,%RDI,8),%R8 |
(4339) 0x510be1 VXORPD %XMM0,%XMM0,%XMM0 |
(4339) 0x510be5 MOV %R8,%R11 |
(4339) 0x510be8 SUB %R10,%R11 |
(4339) 0x510beb JLE 510bc0 |
(4339) 0x510bed MOV %R11,%R9 |
(4339) 0x510bf0 AND $-0x4,%R9 |
(4339) 0x510bf4 JE 510c80 |
(4339) 0x510bfa MOV %R15,%RBX |
(4339) 0x510bfd LEA -0x1(%R9),%R15 |
(4339) 0x510c01 LEA (%R14,%R10,8),%R13 |
(4339) 0x510c05 LEA (%RDX,%R10,8),%RAX |
(4339) 0x510c09 VXORPD %XMM0,%XMM0,%XMM0 |
(4339) 0x510c0d XOR %R12D,%R12D |
(4341) 0x510c10 VMOVUPD (%RAX,%R12,8),%YMM1 |
(4341) 0x510c16 KXNORW %K0,%K0,%K1 |
(4341) 0x510c1a VXORPD %XMM2,%XMM2,%XMM2 |
(4341) 0x510c1e VGATHERQPD (%RCX,%YMM1,8),%YMM2{%K1} |
(4341) 0x510c25 VFMADD231PD (%R13,%R12,8),%YMM2,%YMM0 |
(4341) 0x510c2c ADD $0x4,%R12 |
(4341) 0x510c30 CMP %R15,%R12 |
(4341) 0x510c33 JBE 510c10 |
(4339) 0x510c35 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(4339) 0x510c3b VADDPD %XMM1,%XMM0,%XMM0 |
(4339) 0x510c3f VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(4339) 0x510c44 VADDSD %XMM1,%XMM0,%XMM0 |
(4339) 0x510c48 CMP %R9,%R11 |
(4339) 0x510c4b MOV -0x38(%RBP),%R12 |
(4339) 0x510c4f MOV %RBX,%R15 |
(4339) 0x510c52 MOV -0x30(%RBP),%RBX |
(4339) 0x510c56 MOV 0x30(%RBP),%R13 |
(4339) 0x510c5a JE 510bc0 |
(4339) 0x510c60 JMP 510c83 |
0x510c62 NOPW %CS:(%RAX,%RAX,1) |
0x510c71 NOPW %CS:(%RAX,%RAX,1) |
(4339) 0x510c80 XOR %R9D,%R9D |
(4339) 0x510c83 ADD %R10,%R9 |
(4339) 0x510c86 NOPW %CS:(%RAX,%RAX,1) |
(4340) 0x510c90 MOV (%RDX,%R9,8),%RAX |
(4340) 0x510c94 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4340) 0x510c99 VFMADD231SD (%R14,%R9,8),%XMM1,%XMM0 |
(4340) 0x510c9f INC %R9 |
(4340) 0x510ca2 CMP %R9,%R8 |
(4340) 0x510ca5 JNE 510c90 |
(4339) 0x510ca7 JMP 510bc0 |
0x510cac NOPW %CS:(%RAX,%RAX,1) |
0x510cbb NOPL (%RAX,%RAX,1) |
0x510cc0 VUCOMISD 0x1a228(%RIP),%XMM5 |
0x510cc8 MOV %R15,%RSI |
0x510ccb JNE 510f40 |
0x510cd1 VUCOMISD 0x19337(%RIP),%XMM0 |
0x510cd9 JNE 511080 |
0x510cdf CMP %RSI,%R12 |
0x510ce2 JGE 511a80 |
0x510ce8 MOV %R12,%RAX |
0x510ceb NOT %RAX |
0x510cee ADD %RAX,%RSI |
0x510cf1 XOR %EDI,%EDI |
0x510cf3 VMOVDDUP 0x19fa5(%RIP),%XMM0 |
0x510cfb JMP 510d14 |
0x510cfd NOPL (%RAX) |
(4330) 0x510d00 VMOVSD %XMM1,(%R13,%R8,8) |
(4330) 0x510d07 CMP %RSI,%RDI |
(4330) 0x510d0a LEA 0x1(%RDI),%RDI |
(4330) 0x510d0e JE 511a80 |
(4330) 0x510d14 LEA (%R12,%RDI,1),%R8 |
(4330) 0x510d18 MOV 0x28(%RBP),%RAX |
(4330) 0x510d1c VMOVSD (%RAX,%R8,8),%XMM1 |
(4330) 0x510d22 VXORPD %XMM0,%XMM1,%XMM1 |
(4330) 0x510d26 MOV (%RBX,%R8,8),%R11 |
(4330) 0x510d2a MOV 0x8(%RBX,%R8,8),%R9 |
(4330) 0x510d2f MOV %R9,%R15 |
(4330) 0x510d32 SUB %R11,%R15 |
(4330) 0x510d35 JLE 510d00 |
(4330) 0x510d37 MOV %R15,%R10 |
(4330) 0x510d3a AND $-0x4,%R10 |
(4330) 0x510d3e JE 510dc0 |
(4330) 0x510d44 MOV %RSI,%RBX |
(4330) 0x510d47 LEA -0x1(%R10),%R13 |
(4330) 0x510d4b LEA (%R14,%R11,8),%RSI |
(4330) 0x510d4f LEA (%RDX,%R11,8),%RAX |
(4330) 0x510d53 VXORPD %XMM2,%XMM2,%XMM2 |
(4330) 0x510d57 XOR %R12D,%R12D |
(4330) 0x510d5a NOPW (%RAX,%RAX,1) |
(4332) 0x510d60 VMOVUPD (%RAX,%R12,8),%YMM3 |
(4332) 0x510d66 KXNORW %K0,%K0,%K1 |
(4332) 0x510d6a VXORPD %XMM4,%XMM4,%XMM4 |
(4332) 0x510d6e VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4332) 0x510d75 VFMADD231PD (%RSI,%R12,8),%YMM4,%YMM2 |
(4332) 0x510d7b ADD $0x4,%R12 |
(4332) 0x510d7f CMP %R13,%R12 |
(4332) 0x510d82 JBE 510d60 |
(4330) 0x510d84 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4330) 0x510d8a VADDPD %XMM3,%XMM2,%XMM2 |
(4330) 0x510d8e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4330) 0x510d93 VADDSD %XMM3,%XMM2,%XMM2 |
(4330) 0x510d97 VADDSD %XMM2,%XMM1,%XMM1 |
(4330) 0x510d9b CMP %R10,%R15 |
(4330) 0x510d9e MOV -0x38(%RBP),%R12 |
(4330) 0x510da2 MOV %RBX,%RSI |
(4330) 0x510da5 MOV -0x30(%RBP),%RBX |
(4330) 0x510da9 MOV 0x30(%RBP),%R13 |
(4330) 0x510dad JE 510d00 |
(4330) 0x510db3 JMP 510dc3 |
0x510db5 NOPW %CS:(%RAX,%RAX,1) |
(4330) 0x510dc0 XOR %R10D,%R10D |
(4330) 0x510dc3 ADD %R11,%R10 |
(4330) 0x510dc6 NOPW %CS:(%RAX,%RAX,1) |
(4331) 0x510dd0 MOV (%RDX,%R10,8),%RAX |
(4331) 0x510dd4 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4331) 0x510dd9 VFMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4331) 0x510ddf INC %R10 |
(4331) 0x510de2 CMP %R10,%R9 |
(4331) 0x510de5 JNE 510dd0 |
(4330) 0x510de7 JMP 510d00 |
0x510dec NOPW %CS:(%RAX,%RAX,1) |
0x510dfb NOPL (%RAX,%RAX,1) |
0x510e00 VUCOMISD 0x1a0e8(%RIP),%XMM0 |
0x510e08 JNE 5111c0 |
0x510e0e CMP %R15,%R12 |
0x510e11 JGE 511a80 |
0x510e17 MOV %R12,%RAX |
0x510e1a NOT %RAX |
0x510e1d ADD %RAX,%R15 |
0x510e20 XOR %ESI,%ESI |
0x510e22 JMP 510e54 |
0x510e24 NOPW %CS:(%RAX,%RAX,1) |
0x510e33 NOPW %CS:(%RAX,%RAX,1) |
(4336) 0x510e40 VMOVSD %XMM0,(%R13,%RDI,8) |
(4336) 0x510e47 CMP %R15,%RSI |
(4336) 0x510e4a LEA 0x1(%RSI),%RSI |
(4336) 0x510e4e JE 511a80 |
(4336) 0x510e54 LEA (%R12,%RSI,1),%RDI |
(4336) 0x510e58 MOV (%RBX,%RDI,8),%R10 |
(4336) 0x510e5c MOV 0x8(%RBX,%RDI,8),%R8 |
(4336) 0x510e61 VXORPD %XMM0,%XMM0,%XMM0 |
(4336) 0x510e65 MOV %R8,%R11 |
(4336) 0x510e68 SUB %R10,%R11 |
(4336) 0x510e6b JLE 510e40 |
(4336) 0x510e6d MOV %R11,%R9 |
(4336) 0x510e70 AND $-0x4,%R9 |
(4336) 0x510e74 JE 510f00 |
(4336) 0x510e7a MOV %R15,%RBX |
(4336) 0x510e7d LEA -0x1(%R9),%R15 |
(4336) 0x510e81 LEA (%R14,%R10,8),%R13 |
(4336) 0x510e85 LEA (%RDX,%R10,8),%RAX |
(4336) 0x510e89 VXORPD %XMM0,%XMM0,%XMM0 |
(4336) 0x510e8d XOR %R12D,%R12D |
(4338) 0x510e90 VMOVUPD (%RAX,%R12,8),%YMM1 |
(4338) 0x510e96 VXORPD %XMM2,%XMM2,%XMM2 |
(4338) 0x510e9a KXNORW %K0,%K0,%K1 |
(4338) 0x510e9e VGATHERQPD (%RCX,%YMM1,8),%YMM2{%K1} |
(4338) 0x510ea5 VFNMADD231PD (%R13,%R12,8),%YMM2,%YMM0 |
(4338) 0x510eac ADD $0x4,%R12 |
(4338) 0x510eb0 CMP %R15,%R12 |
(4338) 0x510eb3 JBE 510e90 |
(4336) 0x510eb5 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(4336) 0x510ebb VADDPD %XMM1,%XMM0,%XMM0 |
(4336) 0x510ebf VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(4336) 0x510ec4 VADDSD %XMM1,%XMM0,%XMM0 |
(4336) 0x510ec8 CMP %R9,%R11 |
(4336) 0x510ecb MOV -0x38(%RBP),%R12 |
(4336) 0x510ecf MOV %RBX,%R15 |
(4336) 0x510ed2 MOV -0x30(%RBP),%RBX |
(4336) 0x510ed6 MOV 0x30(%RBP),%R13 |
(4336) 0x510eda JE 510e40 |
(4336) 0x510ee0 JMP 510f03 |
0x510ee2 NOPW %CS:(%RAX,%RAX,1) |
0x510ef1 NOPW %CS:(%RAX,%RAX,1) |
(4336) 0x510f00 XOR %R9D,%R9D |
(4336) 0x510f03 ADD %R10,%R9 |
(4336) 0x510f06 NOPW %CS:(%RAX,%RAX,1) |
(4337) 0x510f10 MOV (%RDX,%R9,8),%RAX |
(4337) 0x510f14 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4337) 0x510f19 VFNMADD231SD (%R14,%R9,8),%XMM1,%XMM0 |
(4337) 0x510f1f INC %R9 |
(4337) 0x510f22 CMP %R9,%R8 |
(4337) 0x510f25 JNE 510f10 |
(4336) 0x510f27 JMP 510e40 |
0x510f2c NOPW %CS:(%RAX,%RAX,1) |
0x510f3b NOPL (%RAX,%RAX,1) |
0x510f40 VUCOMISD 0x190c8(%RIP),%XMM5 |
0x510f48 JNE 511300 |
0x510f4e VUCOMISD 0x190ba(%RIP),%XMM0 |
0x510f56 JNE 511440 |
0x510f5c CMP %RSI,%R12 |
0x510f5f JGE 511a80 |
0x510f65 MOV %R12,%RAX |
0x510f68 NOT %RAX |
0x510f6b ADD %RAX,%RSI |
0x510f6e XOR %EDI,%EDI |
0x510f70 MOV %RSI,-0x30(%RBP) |
0x510f74 JMP 510f94 |
0x510f76 NOPW %CS:(%RAX,%RAX,1) |
(4321) 0x510f80 VMOVSD %XMM0,(%R13,%R8,8) |
(4321) 0x510f87 CMP %RSI,%RDI |
(4321) 0x510f8a LEA 0x1(%RDI),%RDI |
(4321) 0x510f8e JE 511a80 |
(4321) 0x510f94 LEA (%R12,%RDI,1),%R8 |
(4321) 0x510f98 MOV 0x28(%RBP),%RAX |
(4321) 0x510f9c VMOVSD (%RAX,%R8,8),%XMM0 |
(4321) 0x510fa2 MOV (%RBX,%R8,8),%R11 |
(4321) 0x510fa6 MOV 0x8(%RBX,%R8,8),%R9 |
(4321) 0x510fab MOV %R9,%R15 |
(4321) 0x510fae SUB %R11,%R15 |
(4321) 0x510fb1 JLE 510f80 |
(4321) 0x510fb3 MOV %R15,%R10 |
(4321) 0x510fb6 AND $-0x4,%R10 |
(4321) 0x510fba JE 511040 |
(4321) 0x510fc0 LEA -0x1(%R10),%R13 |
(4321) 0x510fc4 LEA (%R14,%R11,8),%RSI |
(4321) 0x510fc8 LEA (%RDX,%R11,8),%RAX |
(4321) 0x510fcc VXORPD %XMM1,%XMM1,%XMM1 |
(4321) 0x510fd0 XOR %R12D,%R12D |
(4321) 0x510fd3 NOPW %CS:(%RAX,%RAX,1) |
(4323) 0x510fe0 VMOVUPD (%RAX,%R12,8),%YMM2 |
(4323) 0x510fe6 VXORPD %XMM3,%XMM3,%XMM3 |
(4323) 0x510fea KXNORW %K0,%K0,%K1 |
(4323) 0x510fee VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(4323) 0x510ff5 VFMADD231PD (%RSI,%R12,8),%YMM3,%YMM1 |
(4323) 0x510ffb ADD $0x4,%R12 |
(4323) 0x510fff CMP %R13,%R12 |
(4323) 0x511002 JBE 510fe0 |
(4321) 0x511004 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4321) 0x51100a VADDPD %XMM2,%XMM1,%XMM1 |
(4321) 0x51100e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4321) 0x511013 VADDSD %XMM2,%XMM1,%XMM1 |
(4321) 0x511017 VADDSD %XMM1,%XMM0,%XMM0 |
(4321) 0x51101b CMP %R10,%R15 |
(4321) 0x51101e MOV -0x38(%RBP),%R12 |
(4321) 0x511022 MOV -0x30(%RBP),%RSI |
(4321) 0x511026 MOV 0x30(%RBP),%R13 |
(4321) 0x51102a JE 510f80 |
(4321) 0x511030 JMP 511043 |
0x511032 NOPW %CS:(%RAX,%RAX,1) |
(4321) 0x511040 XOR %R10D,%R10D |
(4321) 0x511043 ADD %R11,%R10 |
(4321) 0x511046 NOPW %CS:(%RAX,%RAX,1) |
(4322) 0x511050 MOV (%RDX,%R10,8),%RAX |
(4322) 0x511054 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4322) 0x511059 VFMADD231SD (%R14,%R10,8),%XMM1,%XMM0 |
(4322) 0x51105f INC %R10 |
(4322) 0x511062 CMP %R10,%R9 |
(4322) 0x511065 JNE 511050 |
(4321) 0x511067 JMP 510f80 |
0x51106c NOPW %CS:(%RAX,%RAX,1) |
0x51107b NOPL (%RAX,%RAX,1) |
0x511080 VUCOMISD 0x19e68(%RIP),%XMM0 |
0x511088 JNE 511580 |
0x51108e CMP %RSI,%R12 |
0x511091 JGE 511a80 |
0x511097 MOV %R12,%RAX |
0x51109a NOT %RAX |
0x51109d ADD %RAX,%RSI |
0x5110a0 XOR %EDI,%EDI |
0x5110a2 MOV %RSI,-0x30(%RBP) |
0x5110a6 JMP 5110d4 |
0x5110a8 NOPW %CS:(%RAX,%RAX,1) |
0x5110b7 NOPW (%RAX,%RAX,1) |
(4327) 0x5110c0 VMOVSD %XMM0,(%R13,%R8,8) |
(4327) 0x5110c7 CMP %RSI,%RDI |
(4327) 0x5110ca LEA 0x1(%RDI),%RDI |
(4327) 0x5110ce JE 511a80 |
(4327) 0x5110d4 LEA (%R12,%RDI,1),%R8 |
(4327) 0x5110d8 MOV 0x28(%RBP),%RAX |
(4327) 0x5110dc VMOVSD (%RAX,%R8,8),%XMM0 |
(4327) 0x5110e2 MOV (%RBX,%R8,8),%R11 |
(4327) 0x5110e6 MOV 0x8(%RBX,%R8,8),%R9 |
(4327) 0x5110eb MOV %R9,%R15 |
(4327) 0x5110ee SUB %R11,%R15 |
(4327) 0x5110f1 JLE 5110c0 |
(4327) 0x5110f3 MOV %R15,%R10 |
(4327) 0x5110f6 AND $-0x4,%R10 |
(4327) 0x5110fa JE 511180 |
(4327) 0x511100 LEA -0x1(%R10),%R13 |
(4327) 0x511104 LEA (%R14,%R11,8),%RSI |
(4327) 0x511108 LEA (%RDX,%R11,8),%RAX |
(4327) 0x51110c VXORPD %XMM1,%XMM1,%XMM1 |
(4327) 0x511110 XOR %R12D,%R12D |
(4327) 0x511113 NOPW %CS:(%RAX,%RAX,1) |
(4329) 0x511120 VMOVUPD (%RAX,%R12,8),%YMM2 |
(4329) 0x511126 KXNORW %K0,%K0,%K1 |
(4329) 0x51112a VXORPD %XMM3,%XMM3,%XMM3 |
(4329) 0x51112e VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(4329) 0x511135 VFNMADD231PD (%RSI,%R12,8),%YMM3,%YMM1 |
(4329) 0x51113b ADD $0x4,%R12 |
(4329) 0x51113f CMP %R13,%R12 |
(4329) 0x511142 JBE 511120 |
(4327) 0x511144 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4327) 0x51114a VADDPD %XMM2,%XMM1,%XMM1 |
(4327) 0x51114e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4327) 0x511153 VADDSD %XMM2,%XMM1,%XMM1 |
(4327) 0x511157 VADDSD %XMM1,%XMM0,%XMM0 |
(4327) 0x51115b CMP %R10,%R15 |
(4327) 0x51115e MOV -0x38(%RBP),%R12 |
(4327) 0x511162 MOV -0x30(%RBP),%RSI |
(4327) 0x511166 MOV 0x30(%RBP),%R13 |
(4327) 0x51116a JE 5110c0 |
(4327) 0x511170 JMP 511183 |
0x511172 NOPW %CS:(%RAX,%RAX,1) |
(4327) 0x511180 XOR %R10D,%R10D |
(4327) 0x511183 ADD %R11,%R10 |
(4327) 0x511186 NOPW %CS:(%RAX,%RAX,1) |
(4328) 0x511190 MOV (%RDX,%R10,8),%RAX |
(4328) 0x511194 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4328) 0x511199 VFNMADD231SD (%R14,%R10,8),%XMM1,%XMM0 |
(4328) 0x51119f INC %R10 |
(4328) 0x5111a2 CMP %R10,%R9 |
(4328) 0x5111a5 JNE 511190 |
(4327) 0x5111a7 JMP 5110c0 |
0x5111ac NOPW %CS:(%RAX,%RAX,1) |
0x5111bb NOPL (%RAX,%RAX,1) |
0x5111c0 CMP %R15,%R12 |
0x5111c3 JGE 511a80 |
0x5111c9 MOV %R12,%RAX |
0x5111cc NOT %RAX |
0x5111cf ADD %RAX,%R15 |
0x5111d2 XOR %ESI,%ESI |
0x5111d4 JMP 511218 |
0x5111d6 NOPW %CS:(%RAX,%RAX,1) |
0x5111e5 NOPW %CS:(%RAX,%RAX,1) |
0x5111f4 NOPW %CS:(%RAX,%RAX,1) |
(4333) 0x511200 VMULSD %XMM0,%XMM1,%XMM1 |
(4333) 0x511204 VMOVSD %XMM1,(%R13,%RDI,8) |
(4333) 0x51120b CMP %R15,%RSI |
(4333) 0x51120e LEA 0x1(%RSI),%RSI |
(4333) 0x511212 JE 511a80 |
(4333) 0x511218 LEA (%R12,%RSI,1),%RDI |
(4333) 0x51121c MOV (%RBX,%RDI,8),%R10 |
(4333) 0x511220 MOV 0x8(%RBX,%RDI,8),%R8 |
(4333) 0x511225 VXORPD %XMM1,%XMM1,%XMM1 |
(4333) 0x511229 MOV %R8,%R11 |
(4333) 0x51122c SUB %R10,%R11 |
(4333) 0x51122f JLE 511200 |
(4333) 0x511231 MOV %R11,%R9 |
(4333) 0x511234 AND $-0x4,%R9 |
(4333) 0x511238 JE 5112c0 |
(4333) 0x51123e MOV %R15,%RBX |
(4333) 0x511241 LEA -0x1(%R9),%R15 |
(4333) 0x511245 LEA (%R14,%R10,8),%R13 |
(4333) 0x511249 LEA (%RDX,%R10,8),%RAX |
(4333) 0x51124d VXORPD %XMM1,%XMM1,%XMM1 |
(4333) 0x511251 XOR %R12D,%R12D |
(4333) 0x511254 NOPW %CS:(%RAX,%RAX,1) |
(4335) 0x511260 VMOVUPD (%RAX,%R12,8),%YMM2 |
(4335) 0x511266 VXORPD %XMM3,%XMM3,%XMM3 |
(4335) 0x51126a KXNORW %K0,%K0,%K1 |
(4335) 0x51126e VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(4335) 0x511275 VFMADD231PD (%R13,%R12,8),%YMM3,%YMM1 |
(4335) 0x51127c ADD $0x4,%R12 |
(4335) 0x511280 CMP %R15,%R12 |
(4335) 0x511283 JBE 511260 |
(4333) 0x511285 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4333) 0x51128b VADDPD %XMM2,%XMM1,%XMM1 |
(4333) 0x51128f VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4333) 0x511294 VADDSD %XMM2,%XMM1,%XMM1 |
(4333) 0x511298 CMP %R9,%R11 |
(4333) 0x51129b MOV -0x38(%RBP),%R12 |
(4333) 0x51129f MOV %RBX,%R15 |
(4333) 0x5112a2 MOV -0x30(%RBP),%RBX |
(4333) 0x5112a6 MOV 0x30(%RBP),%R13 |
(4333) 0x5112aa JE 511200 |
(4333) 0x5112b0 JMP 5112c3 |
0x5112b2 NOPW %CS:(%RAX,%RAX,1) |
(4333) 0x5112c0 XOR %R9D,%R9D |
(4333) 0x5112c3 ADD %R10,%R9 |
(4333) 0x5112c6 NOPW %CS:(%RAX,%RAX,1) |
(4334) 0x5112d0 MOV (%RDX,%R9,8),%RAX |
(4334) 0x5112d4 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4334) 0x5112d9 VFMADD231SD (%R14,%R9,8),%XMM2,%XMM1 |
(4334) 0x5112df INC %R9 |
(4334) 0x5112e2 CMP %R9,%R8 |
(4334) 0x5112e5 JNE 5112d0 |
(4333) 0x5112e7 JMP 511200 |
0x5112ec NOPW %CS:(%RAX,%RAX,1) |
0x5112fb NOPL (%RAX,%RAX,1) |
0x511300 VUCOMISD 0x18d08(%RIP),%XMM0 |
0x511308 JNE 5116c0 |
0x51130e CMP %RSI,%R12 |
0x511311 JGE 511a80 |
0x511317 MOV %R12,%RAX |
0x51131a NOT %RAX |
0x51131d ADD %RAX,%RSI |
0x511320 XOR %EDI,%EDI |
0x511322 MOV %RSI,-0x30(%RBP) |
0x511326 JMP 511354 |
0x511328 NOPW %CS:(%RAX,%RAX,1) |
0x511337 NOPW (%RAX,%RAX,1) |
(4312) 0x511340 VMOVSD %XMM0,(%R13,%R8,8) |
(4312) 0x511347 CMP %RSI,%RDI |
(4312) 0x51134a LEA 0x1(%RDI),%RDI |
(4312) 0x51134e JE 511a80 |
(4312) 0x511354 LEA (%R12,%RDI,1),%R8 |
(4312) 0x511358 MOV 0x28(%RBP),%RAX |
(4312) 0x51135c VMULSD (%RAX,%R8,8),%XMM5,%XMM0 |
(4312) 0x511362 MOV (%RBX,%R8,8),%R11 |
(4312) 0x511366 MOV 0x8(%RBX,%R8,8),%R9 |
(4312) 0x51136b MOV %R9,%R15 |
(4312) 0x51136e SUB %R11,%R15 |
(4312) 0x511371 JLE 511340 |
(4312) 0x511373 MOV %R15,%R10 |
(4312) 0x511376 AND $-0x4,%R10 |
(4312) 0x51137a JE 511400 |
(4312) 0x511380 LEA -0x1(%R10),%R13 |
(4312) 0x511384 LEA (%R14,%R11,8),%RSI |
(4312) 0x511388 LEA (%RDX,%R11,8),%RAX |
(4312) 0x51138c VXORPD %XMM1,%XMM1,%XMM1 |
(4312) 0x511390 XOR %R12D,%R12D |
(4312) 0x511393 NOPW %CS:(%RAX,%RAX,1) |
(4314) 0x5113a0 VMOVUPD (%RAX,%R12,8),%YMM2 |
(4314) 0x5113a6 KXNORW %K0,%K0,%K1 |
(4314) 0x5113aa VXORPD %XMM3,%XMM3,%XMM3 |
(4314) 0x5113ae VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(4314) 0x5113b5 VFMADD231PD (%RSI,%R12,8),%YMM3,%YMM1 |
(4314) 0x5113bb ADD $0x4,%R12 |
(4314) 0x5113bf CMP %R13,%R12 |
(4314) 0x5113c2 JBE 5113a0 |
(4312) 0x5113c4 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4312) 0x5113ca VADDPD %XMM2,%XMM1,%XMM1 |
(4312) 0x5113ce VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4312) 0x5113d3 VADDSD %XMM2,%XMM1,%XMM1 |
(4312) 0x5113d7 VADDSD %XMM1,%XMM0,%XMM0 |
(4312) 0x5113db CMP %R10,%R15 |
(4312) 0x5113de MOV -0x38(%RBP),%R12 |
(4312) 0x5113e2 MOV -0x30(%RBP),%RSI |
(4312) 0x5113e6 MOV 0x30(%RBP),%R13 |
(4312) 0x5113ea JE 511340 |
(4312) 0x5113f0 JMP 511403 |
0x5113f2 NOPW %CS:(%RAX,%RAX,1) |
(4312) 0x511400 XOR %R10D,%R10D |
(4312) 0x511403 ADD %R11,%R10 |
(4312) 0x511406 NOPW %CS:(%RAX,%RAX,1) |
(4313) 0x511410 MOV (%RDX,%R10,8),%RAX |
(4313) 0x511414 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4313) 0x511419 VFMADD231SD (%R14,%R10,8),%XMM1,%XMM0 |
(4313) 0x51141f INC %R10 |
(4313) 0x511422 CMP %R10,%R9 |
(4313) 0x511425 JNE 511410 |
(4312) 0x511427 JMP 511340 |
0x51142c NOPW %CS:(%RAX,%RAX,1) |
0x51143b NOPL (%RAX,%RAX,1) |
0x511440 VUCOMISD 0x19aa8(%RIP),%XMM0 |
0x511448 JNE 511800 |
0x51144e CMP %RSI,%R12 |
0x511451 JGE 511a80 |
0x511457 MOV %R12,%RAX |
0x51145a NOT %RAX |
0x51145d ADD %RAX,%RSI |
0x511460 XOR %EDI,%EDI |
0x511462 VMOVDDUP 0x19836(%RIP),%XMM0 |
0x51146a MOV %RSI,-0x30(%RBP) |
0x51146e JMP 511494 |
0x511470 NOPW %CS:(%RAX,%RAX,1) |
0x51147f NOP |
(4318) 0x511480 VMOVSD %XMM1,(%R13,%R8,8) |
(4318) 0x511487 CMP %RSI,%RDI |
(4318) 0x51148a LEA 0x1(%RDI),%RDI |
(4318) 0x51148e JE 511a80 |
(4318) 0x511494 LEA (%R12,%RDI,1),%R8 |
(4318) 0x511498 MOV 0x28(%RBP),%RAX |
(4318) 0x51149c VMOVSD (%RAX,%R8,8),%XMM1 |
(4318) 0x5114a2 VXORPD %XMM0,%XMM1,%XMM1 |
(4318) 0x5114a6 MOV (%RBX,%R8,8),%R11 |
(4318) 0x5114aa MOV 0x8(%RBX,%R8,8),%R9 |
(4318) 0x5114af MOV %R9,%R15 |
(4318) 0x5114b2 SUB %R11,%R15 |
(4318) 0x5114b5 JLE 511480 |
(4318) 0x5114b7 MOV %R15,%R10 |
(4318) 0x5114ba AND $-0x4,%R10 |
(4318) 0x5114be JE 511540 |
(4318) 0x5114c4 LEA -0x1(%R10),%R13 |
(4318) 0x5114c8 LEA (%R14,%R11,8),%RSI |
(4318) 0x5114cc LEA (%RDX,%R11,8),%RAX |
(4318) 0x5114d0 VXORPD %XMM2,%XMM2,%XMM2 |
(4318) 0x5114d4 XOR %R12D,%R12D |
(4318) 0x5114d7 NOPW (%RAX,%RAX,1) |
(4320) 0x5114e0 VMOVUPD (%RAX,%R12,8),%YMM3 |
(4320) 0x5114e6 VXORPD %XMM4,%XMM4,%XMM4 |
(4320) 0x5114ea KXNORW %K0,%K0,%K1 |
(4320) 0x5114ee VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4320) 0x5114f5 VFNMADD231PD (%RSI,%R12,8),%YMM4,%YMM2 |
(4320) 0x5114fb ADD $0x4,%R12 |
(4320) 0x5114ff CMP %R13,%R12 |
(4320) 0x511502 JBE 5114e0 |
(4318) 0x511504 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4318) 0x51150a VADDPD %XMM3,%XMM2,%XMM2 |
(4318) 0x51150e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4318) 0x511513 VADDSD %XMM3,%XMM2,%XMM2 |
(4318) 0x511517 VADDSD %XMM2,%XMM1,%XMM1 |
(4318) 0x51151b CMP %R10,%R15 |
(4318) 0x51151e MOV -0x38(%RBP),%R12 |
(4318) 0x511522 MOV -0x30(%RBP),%RSI |
(4318) 0x511526 MOV 0x30(%RBP),%R13 |
(4318) 0x51152a JE 511480 |
(4318) 0x511530 JMP 511543 |
0x511532 NOPW %CS:(%RAX,%RAX,1) |
(4318) 0x511540 XOR %R10D,%R10D |
(4318) 0x511543 ADD %R11,%R10 |
(4318) 0x511546 NOPW %CS:(%RAX,%RAX,1) |
(4319) 0x511550 MOV (%RDX,%R10,8),%RAX |
(4319) 0x511554 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4319) 0x511559 VFNMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4319) 0x51155f INC %R10 |
(4319) 0x511562 CMP %R10,%R9 |
(4319) 0x511565 JNE 511550 |
(4318) 0x511567 JMP 511480 |
0x51156c NOPW %CS:(%RAX,%RAX,1) |
0x51157b NOPL (%RAX,%RAX,1) |
0x511580 CMP %RSI,%R12 |
0x511583 JGE 511a80 |
0x511589 MOV %R12,%RAX |
0x51158c NOT %RAX |
0x51158f ADD %RAX,%RSI |
0x511592 XOR %EDI,%EDI |
0x511594 VMOVDDUP 0x19704(%RIP),%XMM1 |
0x51159c MOV %RSI,-0x30(%RBP) |
0x5115a0 JMP 5115d8 |
0x5115a2 NOPW %CS:(%RAX,%RAX,1) |
0x5115b1 NOPW %CS:(%RAX,%RAX,1) |
(4324) 0x5115c0 VMULSD %XMM0,%XMM2,%XMM2 |
(4324) 0x5115c4 VMOVSD %XMM2,(%R13,%R8,8) |
(4324) 0x5115cb CMP %RSI,%RDI |
(4324) 0x5115ce LEA 0x1(%RDI),%RDI |
(4324) 0x5115d2 JE 511a80 |
(4324) 0x5115d8 LEA (%R12,%RDI,1),%R8 |
(4324) 0x5115dc MOV 0x28(%RBP),%RAX |
(4324) 0x5115e0 VMOVSD (%RAX,%R8,8),%XMM2 |
(4324) 0x5115e6 VXORPD %XMM1,%XMM2,%XMM2 |
(4324) 0x5115ea MOV (%RBX,%R8,8),%R11 |
(4324) 0x5115ee MOV 0x8(%RBX,%R8,8),%R9 |
(4324) 0x5115f3 MOV %R9,%R15 |
(4324) 0x5115f6 SUB %R11,%R15 |
(4324) 0x5115f9 JLE 5115c0 |
(4324) 0x5115fb MOV %R15,%R10 |
(4324) 0x5115fe AND $-0x4,%R10 |
(4324) 0x511602 JE 511680 |
(4324) 0x511608 LEA -0x1(%R10),%R13 |
(4324) 0x51160c LEA (%R14,%R11,8),%RSI |
(4324) 0x511610 LEA (%RDX,%R11,8),%RAX |
(4324) 0x511614 VXORPD %XMM3,%XMM3,%XMM3 |
(4324) 0x511618 XOR %R12D,%R12D |
(4324) 0x51161b NOPL (%RAX,%RAX,1) |
(4326) 0x511620 VMOVUPD (%RAX,%R12,8),%YMM4 |
(4326) 0x511626 VXORPD %XMM5,%XMM5,%XMM5 |
(4326) 0x51162a KXNORW %K0,%K0,%K1 |
(4326) 0x51162e VGATHERQPD (%RCX,%YMM4,8),%YMM5{%K1} |
(4326) 0x511635 VFMADD231PD (%RSI,%R12,8),%YMM5,%YMM3 |
(4326) 0x51163b ADD $0x4,%R12 |
(4326) 0x51163f CMP %R13,%R12 |
(4326) 0x511642 JBE 511620 |
(4324) 0x511644 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(4324) 0x51164a VADDPD %XMM4,%XMM3,%XMM3 |
(4324) 0x51164e VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(4324) 0x511653 VADDSD %XMM4,%XMM3,%XMM3 |
(4324) 0x511657 VADDSD %XMM3,%XMM2,%XMM2 |
(4324) 0x51165b CMP %R10,%R15 |
(4324) 0x51165e MOV -0x38(%RBP),%R12 |
(4324) 0x511662 MOV -0x30(%RBP),%RSI |
(4324) 0x511666 MOV 0x30(%RBP),%R13 |
(4324) 0x51166a JE 5115c0 |
(4324) 0x511670 JMP 511683 |
0x511672 NOPW %CS:(%RAX,%RAX,1) |
(4324) 0x511680 XOR %R10D,%R10D |
(4324) 0x511683 ADD %R11,%R10 |
(4324) 0x511686 NOPW %CS:(%RAX,%RAX,1) |
(4325) 0x511690 MOV (%RDX,%R10,8),%RAX |
(4325) 0x511694 VMOVSD (%RCX,%RAX,8),%XMM3 |
(4325) 0x511699 VFMADD231SD (%R14,%R10,8),%XMM3,%XMM2 |
(4325) 0x51169f INC %R10 |
(4325) 0x5116a2 CMP %R10,%R9 |
(4325) 0x5116a5 JNE 511690 |
(4324) 0x5116a7 JMP 5115c0 |
0x5116ac NOPW %CS:(%RAX,%RAX,1) |
0x5116bb NOPL (%RAX,%RAX,1) |
0x5116c0 VUCOMISD 0x19828(%RIP),%XMM0 |
0x5116c8 JNE 511940 |
0x5116ce CMP %RSI,%R12 |
0x5116d1 JGE 511a80 |
0x5116d7 VXORPD 0x195bf(%RIP){1to2},%XMM5,%XMM0 |
0x5116e1 MOV %R12,%RAX |
0x5116e4 NOT %RAX |
0x5116e7 ADD %RAX,%RSI |
0x5116ea XOR %EDI,%EDI |
0x5116ec JMP 511714 |
0x5116ee NOPW %CS:(%RAX,%RAX,1) |
0x5116fd NOPL (%RAX) |
(4309) 0x511700 VMOVSD %XMM1,(%R13,%R8,8) |
(4309) 0x511707 CMP %RSI,%RDI |
(4309) 0x51170a LEA 0x1(%RDI),%RDI |
(4309) 0x51170e JE 511a80 |
(4309) 0x511714 LEA (%R12,%RDI,1),%R8 |
(4309) 0x511718 MOV 0x28(%RBP),%RAX |
(4309) 0x51171c VMULSD (%RAX,%R8,8),%XMM0,%XMM1 |
(4309) 0x511722 MOV (%RBX,%R8,8),%RAX |
(4309) 0x511726 MOV 0x8(%RBX,%R8,8),%R9 |
(4309) 0x51172b MOV %R9,%R15 |
(4309) 0x51172e SUB %RAX,%R15 |
(4309) 0x511731 JLE 511700 |
(4309) 0x511733 MOV %R15,%R10 |
(4309) 0x511736 AND $-0x4,%R10 |
(4309) 0x51173a JE 5117c0 |
(4309) 0x511740 MOV %RSI,%RBX |
(4309) 0x511743 LEA -0x1(%R10),%R13 |
(4309) 0x511747 LEA (%R14,%RAX,8),%RSI |
(4309) 0x51174b MOV %RAX,-0x38(%RBP) |
(4309) 0x51174f LEA (%RDX,%RAX,8),%RAX |
(4309) 0x511753 VXORPD %XMM2,%XMM2,%XMM2 |
(4309) 0x511757 XOR %R11D,%R11D |
(4309) 0x51175a NOPW (%RAX,%RAX,1) |
(4311) 0x511760 VMOVUPD (%RAX,%R11,8),%YMM3 |
(4311) 0x511766 VXORPD %XMM4,%XMM4,%XMM4 |
(4311) 0x51176a KXNORW %K0,%K0,%K1 |
(4311) 0x51176e VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4311) 0x511775 VFNMADD231PD (%RSI,%R11,8),%YMM4,%YMM2 |
(4311) 0x51177b ADD $0x4,%R11 |
(4311) 0x51177f CMP %R13,%R11 |
(4311) 0x511782 JBE 511760 |
(4309) 0x511784 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4309) 0x51178a VADDPD %XMM3,%XMM2,%XMM2 |
(4309) 0x51178e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4309) 0x511793 VADDSD %XMM3,%XMM2,%XMM2 |
(4309) 0x511797 VADDSD %XMM2,%XMM1,%XMM1 |
(4309) 0x51179b CMP %R10,%R15 |
(4309) 0x51179e MOV %RBX,%RSI |
(4309) 0x5117a1 MOV -0x30(%RBP),%RBX |
(4309) 0x5117a5 MOV 0x30(%RBP),%R13 |
(4309) 0x5117a9 MOV -0x38(%RBP),%RAX |
(4309) 0x5117ad JE 511700 |
(4309) 0x5117b3 JMP 5117c3 |
0x5117b5 NOPW %CS:(%RAX,%RAX,1) |
(4309) 0x5117c0 XOR %R10D,%R10D |
(4309) 0x5117c3 ADD %RAX,%R10 |
(4309) 0x5117c6 NOPW %CS:(%RAX,%RAX,1) |
(4310) 0x5117d0 MOV (%RDX,%R10,8),%RAX |
(4310) 0x5117d4 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4310) 0x5117d9 VFNMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4310) 0x5117df INC %R10 |
(4310) 0x5117e2 CMP %R10,%R9 |
(4310) 0x5117e5 JNE 5117d0 |
(4309) 0x5117e7 JMP 511700 |
0x5117ec NOPW %CS:(%RAX,%RAX,1) |
0x5117fb NOPL (%RAX,%RAX,1) |
0x511800 CMP %RSI,%R12 |
0x511803 JGE 511a80 |
0x511809 MOV %R12,%RAX |
0x51180c NOT %RAX |
0x51180f ADD %RAX,%RSI |
0x511812 XOR %EDI,%EDI |
0x511814 MOV %RSI,-0x30(%RBP) |
0x511818 JMP 511858 |
0x51181a NOPW %CS:(%RAX,%RAX,1) |
0x511829 NOPW %CS:(%RAX,%RAX,1) |
0x511838 NOPL (%RAX,%RAX,1) |
(4315) 0x511840 VMULSD %XMM0,%XMM1,%XMM1 |
(4315) 0x511844 VMOVSD %XMM1,(%R13,%R8,8) |
(4315) 0x51184b CMP %RSI,%RDI |
(4315) 0x51184e LEA 0x1(%RDI),%RDI |
(4315) 0x511852 JE 511a80 |
(4315) 0x511858 LEA (%R12,%RDI,1),%R8 |
(4315) 0x51185c MOV 0x28(%RBP),%RAX |
(4315) 0x511860 VMOVSD (%RAX,%R8,8),%XMM1 |
(4315) 0x511866 MOV (%RBX,%R8,8),%R11 |
(4315) 0x51186a MOV 0x8(%RBX,%R8,8),%R9 |
(4315) 0x51186f MOV %R9,%R15 |
(4315) 0x511872 SUB %R11,%R15 |
(4315) 0x511875 JLE 511840 |
(4315) 0x511877 MOV %R15,%R10 |
(4315) 0x51187a AND $-0x4,%R10 |
(4315) 0x51187e JE 511900 |
(4315) 0x511884 LEA -0x1(%R10),%R13 |
(4315) 0x511888 LEA (%R14,%R11,8),%RSI |
(4315) 0x51188c LEA (%RDX,%R11,8),%RAX |
(4315) 0x511890 VXORPD %XMM2,%XMM2,%XMM2 |
(4315) 0x511894 XOR %R12D,%R12D |
(4315) 0x511897 NOPW (%RAX,%RAX,1) |
(4317) 0x5118a0 VMOVUPD (%RAX,%R12,8),%YMM3 |
(4317) 0x5118a6 KXNORW %K0,%K0,%K1 |
(4317) 0x5118aa VXORPD %XMM4,%XMM4,%XMM4 |
(4317) 0x5118ae VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4317) 0x5118b5 VFMADD231PD (%RSI,%R12,8),%YMM4,%YMM2 |
(4317) 0x5118bb ADD $0x4,%R12 |
(4317) 0x5118bf CMP %R13,%R12 |
(4317) 0x5118c2 JBE 5118a0 |
(4315) 0x5118c4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4315) 0x5118ca VADDPD %XMM3,%XMM2,%XMM2 |
(4315) 0x5118ce VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4315) 0x5118d3 VADDSD %XMM3,%XMM2,%XMM2 |
(4315) 0x5118d7 VADDSD %XMM2,%XMM1,%XMM1 |
(4315) 0x5118db CMP %R10,%R15 |
(4315) 0x5118de MOV -0x38(%RBP),%R12 |
(4315) 0x5118e2 MOV -0x30(%RBP),%RSI |
(4315) 0x5118e6 MOV 0x30(%RBP),%R13 |
(4315) 0x5118ea JE 511840 |
(4315) 0x5118f0 JMP 511903 |
0x5118f2 NOPW %CS:(%RAX,%RAX,1) |
(4315) 0x511900 XOR %R10D,%R10D |
(4315) 0x511903 ADD %R11,%R10 |
(4315) 0x511906 NOPW %CS:(%RAX,%RAX,1) |
(4316) 0x511910 MOV (%RDX,%R10,8),%RAX |
(4316) 0x511914 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4316) 0x511919 VFMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4316) 0x51191f INC %R10 |
(4316) 0x511922 CMP %R10,%R9 |
(4316) 0x511925 JNE 511910 |
(4315) 0x511927 JMP 511840 |
0x51192c NOPW %CS:(%RAX,%RAX,1) |
0x51193b NOPL (%RAX,%RAX,1) |
0x511940 CMP %RSI,%R12 |
0x511943 JGE 511a80 |
0x511949 MOV %R12,%RAX |
0x51194c NOT %RAX |
0x51194f ADD %RAX,%RSI |
0x511952 XOR %EDI,%EDI |
0x511954 JMP 511998 |
0x511956 NOPW %CS:(%RAX,%RAX,1) |
0x511965 NOPW %CS:(%RAX,%RAX,1) |
0x511974 NOPW %CS:(%RAX,%RAX,1) |
(4306) 0x511980 VMULSD %XMM0,%XMM1,%XMM1 |
(4306) 0x511984 VMOVSD %XMM1,(%R13,%R8,8) |
(4306) 0x51198b CMP %RSI,%RDI |
(4306) 0x51198e LEA 0x1(%RDI),%RDI |
(4306) 0x511992 JE 511a80 |
(4306) 0x511998 LEA (%R12,%RDI,1),%R8 |
(4306) 0x51199c MOV 0x28(%RBP),%RAX |
(4306) 0x5119a0 VMULSD (%RAX,%R8,8),%XMM5,%XMM1 |
(4306) 0x5119a6 MOV (%RBX,%R8,8),%RAX |
(4306) 0x5119aa MOV 0x8(%RBX,%R8,8),%R9 |
(4306) 0x5119af MOV %R9,%R15 |
(4306) 0x5119b2 SUB %RAX,%R15 |
(4306) 0x5119b5 JLE 511980 |
(4306) 0x5119b7 MOV %R15,%R10 |
(4306) 0x5119ba AND $-0x4,%R10 |
(4306) 0x5119be JE 511a40 |
(4306) 0x5119c4 MOV %RSI,%RBX |
(4306) 0x5119c7 LEA -0x1(%R10),%R13 |
(4306) 0x5119cb LEA (%R14,%RAX,8),%RSI |
(4306) 0x5119cf MOV %RAX,-0x38(%RBP) |
(4306) 0x5119d3 LEA (%RDX,%RAX,8),%R11 |
(4306) 0x5119d7 VXORPD %XMM2,%XMM2,%XMM2 |
(4306) 0x5119db XOR %EAX,%EAX |
(4306) 0x5119dd NOPL (%RAX) |
(4308) 0x5119e0 VMOVUPD (%R11,%RAX,8),%YMM3 |
(4308) 0x5119e6 VXORPD %XMM4,%XMM4,%XMM4 |
(4308) 0x5119ea KXNORW %K0,%K0,%K1 |
(4308) 0x5119ee VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4308) 0x5119f5 VFMADD231PD (%RSI,%RAX,8),%YMM4,%YMM2 |
(4308) 0x5119fb ADD $0x4,%RAX |
(4308) 0x5119ff CMP %R13,%RAX |
(4308) 0x511a02 JBE 5119e0 |
(4306) 0x511a04 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4306) 0x511a0a VADDPD %XMM3,%XMM2,%XMM2 |
(4306) 0x511a0e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4306) 0x511a13 VADDSD %XMM3,%XMM2,%XMM2 |
(4306) 0x511a17 VADDSD %XMM2,%XMM1,%XMM1 |
(4306) 0x511a1b CMP %R10,%R15 |
(4306) 0x511a1e MOV %RBX,%RSI |
(4306) 0x511a21 MOV -0x30(%RBP),%RBX |
(4306) 0x511a25 MOV 0x30(%RBP),%R13 |
(4306) 0x511a29 MOV -0x38(%RBP),%RAX |
(4306) 0x511a2d JE 511980 |
(4306) 0x511a33 JMP 511a43 |
0x511a35 NOPW %CS:(%RAX,%RAX,1) |
(4306) 0x511a40 XOR %R10D,%R10D |
(4306) 0x511a43 ADD %RAX,%R10 |
(4306) 0x511a46 NOPW %CS:(%RAX,%RAX,1) |
(4307) 0x511a50 MOV (%RDX,%R10,8),%RAX |
(4307) 0x511a54 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4307) 0x511a59 VFMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4307) 0x511a5f INC %R10 |
(4307) 0x511a62 CMP %R10,%R9 |
(4307) 0x511a65 JNE 511a50 |
(4306) 0x511a67 JMP 511980 |
0x511a6c NOPW %CS:(%RAX,%RAX,1) |
0x511a7b NOPL (%RAX,%RAX,1) |
0x511a80 ADD $0x18,%RSP |
0x511a84 POP %RBX |
0x511a85 POP %R12 |
0x511a87 POP %R13 |
0x511a89 POP %R14 |
0x511a8b POP %R15 |
0x511a8d POP %RBP |
0x511a8e VZEROUPPER |
0x511a91 RET |
0x511a92 NOPW %CS:(%RAX,%RAX,1) |
Path / |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 259 |
nb uops | 278 |
loop length | 1503 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 7 |
micro-operation queue | 46.33 cycles |
front end | 46.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 19.07 | 10.33 | 10.33 | 11.50 | 18.93 | 20.00 | 11.50 | 11.50 | 11.50 | 19.00 | 10.33 |
cycles | 20.00 | 19.07 | 10.33 | 10.33 | 11.50 | 18.93 | 20.00 | 11.50 | 11.50 | 11.50 | 19.00 | 10.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 44.93 |
Stall cycles | 0.00 |
Front-end | 46.33 |
Dispatch | 20.00 |
Overall L1 | 46.33 |
all | 1% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 1% |
all | 10% |
load | 5% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 4% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 10% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 13% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 50efa0 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 50f060 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 510ad7 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x67> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x52150(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x53be7d,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x53de03,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51b970 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x53e799,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51e980 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 510ae5 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 510b13 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x52114(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x53be7d,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x53e81c,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51b970 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x53e799,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51e980 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 510b22 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 510b55 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x520d7(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x53be7d,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x53e83e,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51b970 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x53e799,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51e980 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD -0x38(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 510cc0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x250> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x1948c(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 510e00 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x390> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 510bd4 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x164> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1a228(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R15,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JNE 510f40 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4d0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x19337(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 511080 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x610> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x19fa5(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 510d14 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x2a4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1a0e8(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 5111c0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x750> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 510e54 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x3e4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x190c8(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 511300 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x890> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x190ba(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 511440 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x9d0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 510f94 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x524> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x19e68(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 511580 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb10> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 5110d4 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x664> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 511218 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7a8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x18d08(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 5116c0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc50> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 511354 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8e4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x19aa8(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 511800 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd90> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x19836(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 511494 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa24> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x19704(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 5115d8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb68> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x19828(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 511940 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xed0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x195bf(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 511714 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xca4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 511858 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xde8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 511998 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xf28> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 259 |
nb uops | 278 |
loop length | 1503 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 7 |
micro-operation queue | 46.33 cycles |
front end | 46.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 19.07 | 10.33 | 10.33 | 11.50 | 18.93 | 20.00 | 11.50 | 11.50 | 11.50 | 19.00 | 10.33 |
cycles | 20.00 | 19.07 | 10.33 | 10.33 | 11.50 | 18.93 | 20.00 | 11.50 | 11.50 | 11.50 | 19.00 | 10.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 44.93 |
Stall cycles | 0.00 |
Front-end | 46.33 |
Dispatch | 20.00 |
Overall L1 | 46.33 |
all | 1% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 1% |
all | 10% |
load | 5% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 4% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 10% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 13% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 50efa0 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 50f060 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 510ad7 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x67> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x52150(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x53be7d,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x53de03,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51b970 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x53e799,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51e980 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 510ae5 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 510b13 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x52114(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x53be7d,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x53e81c,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51b970 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x53e799,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51e980 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 510b22 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 510b55 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x520d7(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x53be7d,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x53e83e,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51b970 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x53e799,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 51e980 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD -0x38(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 510cc0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x250> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x1948c(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 510e00 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x390> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 510bd4 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x164> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1a228(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R15,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JNE 510f40 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4d0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x19337(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 511080 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x610> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x19fa5(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 510d14 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x2a4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1a0e8(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 5111c0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x750> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 510e54 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x3e4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x190c8(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 511300 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x890> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x190ba(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 511440 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x9d0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 510f94 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x524> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x19e68(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 511580 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb10> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 5110d4 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x664> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 511218 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7a8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x18d08(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 5116c0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc50> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 511354 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8e4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x19aa8(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 511800 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd90> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x19836(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 511494 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa24> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x19704(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 5115d8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb68> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x19828(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 511940 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xed0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x195bf(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 511714 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xca4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 511858 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xde8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 511a80 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x1010> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 511998 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xf28> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace.extracted– | 14.69 | 1.85 |
▼Loop 4321 - csr_matvec.c:248-341 - exec– | 1.08 | 0.11 |
○Loop 4322 - csr_matvec.c:337-339 - exec | 0.62 | 0.06 |
○Loop 4323 - csr_matvec.c:337-339 - exec | 0.17 | 0.02 |
▼Loop 4327 - csr_matvec.c:248-314 - exec– | 0.73 | 0.08 |
○Loop 4329 - csr_matvec.c:310-312 - exec | 5.17 | 0.54 |
○Loop 4328 - csr_matvec.c:310-312 - exec | 0.88 | 0.09 |
▼Loop 4339 - csr_matvec.c:248-263 - exec– | 0.63 | 0.07 |
○Loop 4341 - csr_matvec.c:259-261 - exec | 4.6 | 0.48 |
○Loop 4340 - csr_matvec.c:259-261 - exec | 0.81 | 0.08 |
▼Loop 4330 - csr_matvec.c:248-302 - exec– | 0 | 0 |
○Loop 4331 - csr_matvec.c:298-300 - exec | 0 | 0 |
○Loop 4332 - csr_matvec.c:298-300 - exec | 0 | 0 |
▼Loop 4324 - csr_matvec.c:248-326 - exec– | 0 | 0 |
○Loop 4325 - csr_matvec.c:322-324 - exec | 0 | 0 |
○Loop 4326 - csr_matvec.c:322-324 - exec | 0 | 0 |
▼Loop 4318 - csr_matvec.c:248-353 - exec– | 0 | 0 |
○Loop 4320 - csr_matvec.c:349-351 - exec | 0 | 0 |
○Loop 4319 - csr_matvec.c:349-351 - exec | 0 | 0 |
▼Loop 4306 - csr_matvec.c:248-404 - exec– | 0 | 0 |
○Loop 4308 - csr_matvec.c:400-402 - exec | 0 | 0 |
○Loop 4307 - csr_matvec.c:400-402 - exec | 0 | 0 |
▼Loop 4336 - csr_matvec.c:248-275 - exec– | 0 | 0 |
○Loop 4337 - csr_matvec.c:271-273 - exec | 0 | 0 |
○Loop 4338 - csr_matvec.c:271-273 - exec | 0 | 0 |
▼Loop 4309 - csr_matvec.c:248-392 - exec– | 0 | 0 |
○Loop 4310 - csr_matvec.c:388-390 - exec | 0 | 0 |
○Loop 4311 - csr_matvec.c:388-390 - exec | 0 | 0 |
▼Loop 4315 - csr_matvec.c:248-365 - exec– | 0 | 0 |
○Loop 4316 - csr_matvec.c:361-363 - exec | 0 | 0 |
○Loop 4317 - csr_matvec.c:361-363 - exec | 0 | 0 |
▼Loop 4312 - csr_matvec.c:248-380 - exec– | 0 | 0 |
○Loop 4314 - csr_matvec.c:376-378 - exec | 0 | 0 |
○Loop 4313 - csr_matvec.c:376-378 - exec | 0 | 0 |
▼Loop 4333 - csr_matvec.c:248-287 - exec– | 0 | 0 |
○Loop 4335 - csr_matvec.c:283-285 - exec | 0 | 0 |
○Loop 4334 - csr_matvec.c:283-285 - exec | 0 | 0 |