Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 16.57% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 16.57% |
---|
/scratch_na/users/xoserete/qaas_runs/171-172-8218/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 243 - 404 |
-------------------------------------------------------------------------------- |
243: #pragma omp parallel private(i,jj,tempx) |
244: #endif |
245: { |
246: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
247: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
248: hypre_assert(iBegin <= iEnd); |
249: hypre_assert(iBegin >= 0 && iBegin <= num_rows); |
250: hypre_assert(iEnd >= 0 && iEnd <= num_rows); |
251: |
252: if (0 == temp) |
253: { |
254: if (1 == alpha) // JSP: a common path |
255: { |
256: for (i = iBegin; i < iEnd; i++) |
257: { |
258: tempx = 0.0; |
259: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
260: { |
261: tempx += A_data[jj] * x_data[A_j[jj]]; |
262: } |
263: y_data[i] = tempx; |
264: } |
265: } // y = A*x |
266: else if (-1 == alpha) |
267: { |
268: for (i = iBegin; i < iEnd; i++) |
269: { |
270: tempx = 0.0; |
271: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
272: { |
273: tempx -= A_data[jj] * x_data[A_j[jj]]; |
274: } |
275: y_data[i] = tempx; |
276: } |
277: } // y = -A*x |
278: else |
279: { |
280: for (i = iBegin; i < iEnd; i++) |
281: { |
282: tempx = 0.0; |
283: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
284: { |
285: tempx += A_data[jj] * x_data[A_j[jj]]; |
286: } |
287: y_data[i] = alpha*tempx; |
288: } |
289: } // y = alpha*A*x |
290: } // temp == 0 |
291: else if (-1 == temp) // beta == -alpha |
292: { |
293: if (1 == alpha) // JSP: a common path |
294: { |
295: for (i = iBegin; i < iEnd; i++) |
296: { |
297: tempx = -b_data[i]; |
298: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
299: { |
300: tempx += A_data[jj] * x_data[A_j[jj]]; |
301: } |
302: y_data[i] = tempx; |
303: } |
304: } // y = A*x - y |
305: else if (-1 == alpha) // JSP: a common path |
306: { |
307: for (i = iBegin; i < iEnd; i++) |
308: { |
309: tempx = b_data[i]; |
310: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
311: { |
312: tempx -= A_data[jj] * x_data[A_j[jj]]; |
313: } |
314: y_data[i] = tempx; |
315: } |
316: } // y = -A*x + y |
317: else |
318: { |
319: for (i = iBegin; i < iEnd; i++) |
320: { |
321: tempx = -b_data[i]; |
322: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
323: { |
324: tempx += A_data[jj] * x_data[A_j[jj]]; |
325: } |
326: y_data[i] = alpha*tempx; |
327: } |
328: } // y = alpha*(A*x - y) |
329: } // temp == -1 |
330: else if (1 == temp) |
331: { |
332: if (1 == alpha) // JSP: a common path |
333: { |
334: for (i = iBegin; i < iEnd; i++) |
335: { |
336: tempx = b_data[i]; |
337: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
338: { |
339: tempx += A_data[jj] * x_data[A_j[jj]]; |
340: } |
341: y_data[i] = tempx; |
342: } |
343: } // y = A*x + y |
344: else if (-1 == alpha) |
345: { |
346: for (i = iBegin; i < iEnd; i++) |
347: { |
348: tempx = -b_data[i]; |
349: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
350: { |
351: tempx -= A_data[jj] * x_data[A_j[jj]]; |
352: } |
353: y_data[i] = tempx; |
354: } |
355: } // y = -A*x - y |
356: else |
357: { |
358: for (i = iBegin; i < iEnd; i++) |
359: { |
360: tempx = b_data[i]; |
361: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
362: { |
363: tempx += A_data[jj] * x_data[A_j[jj]]; |
364: } |
365: y_data[i] = alpha*tempx; |
[...] |
371: if (1 == alpha) // JSP: a common path |
372: { |
373: for (i = iBegin; i < iEnd; i++) |
374: { |
375: tempx = b_data[i]*temp; |
376: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
377: { |
378: tempx += A_data[jj] * x_data[A_j[jj]]; |
379: } |
380: y_data[i] = tempx; |
381: } |
382: } // y = A*x + temp*y |
383: else if (-1 == alpha) |
384: { |
385: for (i = iBegin; i < iEnd; i++) |
386: { |
387: tempx = -b_data[i]*temp; |
388: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
389: { |
390: tempx -= A_data[jj] * x_data[A_j[jj]]; |
391: } |
392: y_data[i] = tempx; |
393: } |
394: } // y = -A*x - temp*y |
395: else |
396: { |
397: for (i = iBegin; i < iEnd; i++) |
398: { |
399: tempx = b_data[i]*temp; |
400: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
401: { |
402: tempx += A_data[jj] * x_data[A_j[jj]]; |
403: } |
404: y_data[i] = alpha*tempx; |
0x4ddbf0 PUSH %RBP |
0x4ddbf1 MOV %RSP,%RBP |
0x4ddbf4 PUSH %R15 |
0x4ddbf6 PUSH %R14 |
0x4ddbf8 PUSH %R13 |
0x4ddbfa PUSH %R12 |
0x4ddbfc PUSH %RBX |
0x4ddbfd SUB $0x18,%RSP |
0x4ddc01 MOV %R9,%RBX |
0x4ddc04 MOV %R8,%R14 |
0x4ddc07 MOV %RCX,%R12 |
0x4ddc0a MOV %RDX,-0x38(%RBP) |
0x4ddc0e MOV %RCX,%RDI |
0x4ddc11 CALL 4dc680 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> |
0x4ddc16 MOV %R12,%RDI |
0x4ddc19 MOV %RAX,%R12 |
0x4ddc1c CALL 4dc700 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> |
0x4ddc21 MOV %RAX,%R15 |
0x4ddc24 CMP %RAX,%R12 |
0x4ddc27 JLE 4ddc57 |
0x4ddc29 MOV 0x259f90(%RIP),%RDI |
0x4ddc30 MOV $0x510a05,%ESI |
0x4ddc35 MOV $0x512a2b,%EDX |
0x4ddc3a XOR %EAX,%EAX |
0x4ddc3c CALL 4e7000 <hypre_fprintf> |
0x4ddc41 MOV $0x5133d1,%EDI |
0x4ddc46 MOV $0xf8,%ESI |
0x4ddc4b MOV $0x1,%EDX |
0x4ddc50 XOR %ECX,%ECX |
0x4ddc52 CALL 4e9720 <hypre_error_handler> |
0x4ddc57 MOV 0x18(%RBP),%R13 |
0x4ddc5b TEST %R12,%R12 |
0x4ddc5e JS 4ddc65 |
0x4ddc60 CMP %R13,%R12 |
0x4ddc63 JLE 4ddc93 |
0x4ddc65 MOV 0x259f54(%RIP),%RDI |
0x4ddc6c MOV $0x510a05,%ESI |
0x4ddc71 MOV $0x513458,%EDX |
0x4ddc76 XOR %EAX,%EAX |
0x4ddc78 CALL 4e7000 <hypre_fprintf> |
0x4ddc7d MOV $0x5133d1,%EDI |
0x4ddc82 MOV $0xf9,%ESI |
0x4ddc87 MOV $0x1,%EDX |
0x4ddc8c XOR %ECX,%ECX |
0x4ddc8e CALL 4e9720 <hypre_error_handler> |
0x4ddc93 VMOVSD 0x38(%RBP),%XMM5 |
0x4ddc98 TEST %R15,%R15 |
0x4ddc9b JS 4ddca2 |
0x4ddc9d CMP %R13,%R15 |
0x4ddca0 JLE 4ddcd5 |
0x4ddca2 MOV 0x259f17(%RIP),%RDI |
0x4ddca9 MOV $0x510a05,%ESI |
0x4ddcae MOV $0x51347a,%EDX |
0x4ddcb3 XOR %EAX,%EAX |
0x4ddcb5 CALL 4e7000 <hypre_fprintf> |
0x4ddcba MOV $0x5133d1,%EDI |
0x4ddcbf MOV $0xfa,%ESI |
0x4ddcc4 MOV $0x1,%EDX |
0x4ddcc9 XOR %ECX,%ECX |
0x4ddccb CALL 4e9720 <hypre_error_handler> |
0x4ddcd0 VMOVSD 0x38(%RBP),%XMM5 |
0x4ddcd5 MOV 0x20(%RBP),%RCX |
0x4ddcd9 MOV 0x10(%RBP),%RDX |
0x4ddcdd VMOVSD -0x38(%RBP),%XMM0 |
0x4ddce2 VXORPD %XMM1,%XMM1,%XMM1 |
0x4ddce6 VUCOMISD %XMM1,%XMM5 |
0x4ddcea MOV %R12,-0x38(%RBP) |
0x4ddcee MOV %RBX,-0x30(%RBP) |
0x4ddcf2 JNE 4dddfc |
0x4ddcf8 VUCOMISD 0x20850(%RIP),%XMM0 |
0x4ddd00 JNE 4ddf1c |
0x4ddd06 CMP %R15,%R12 |
0x4ddd09 JGE 4de95c |
0x4ddd0f MOV %R12,%RAX |
0x4ddd12 NOT %RAX |
0x4ddd15 ADD %RAX,%R15 |
0x4ddd18 XOR %ESI,%ESI |
0x4ddd1a JMP 4ddd39 |
0x4ddd1c NOPL (%RAX) |
(4312) 0x4ddd20 MOV 0x30(%RBP),%RAX |
(4312) 0x4ddd24 VMOVSD %XMM0,(%RAX,%RDI,8) |
(4312) 0x4ddd29 LEA 0x1(%RSI),%RAX |
(4312) 0x4ddd2d CMP %R15,%RSI |
(4312) 0x4ddd30 MOV %RAX,%RSI |
(4312) 0x4ddd33 JE 4de95c |
(4312) 0x4ddd39 LEA (%R12,%RSI,1),%RDI |
(4312) 0x4ddd3d MOV (%RBX,%RDI,8),%R10 |
(4312) 0x4ddd41 MOV 0x8(%RBX,%RDI,8),%R8 |
(4312) 0x4ddd46 VXORPD %XMM0,%XMM0,%XMM0 |
(4312) 0x4ddd4a MOV %R8,%R11 |
(4312) 0x4ddd4d SUB %R10,%R11 |
(4312) 0x4ddd50 JLE 4ddd20 |
(4312) 0x4ddd52 MOV %R11,%R9 |
(4312) 0x4ddd55 AND $-0x4,%R9 |
(4312) 0x4ddd59 JE 4dddce |
(4312) 0x4ddd5b MOV %R15,%RBX |
(4312) 0x4ddd5e LEA -0x1(%R9),%R15 |
(4312) 0x4ddd62 LEA (%R14,%R10,8),%R13 |
(4312) 0x4ddd66 LEA (%RDX,%R10,8),%RAX |
(4312) 0x4ddd6a VXORPD %XMM0,%XMM0,%XMM0 |
(4312) 0x4ddd6e XOR %R12D,%R12D |
(4312) 0x4ddd71 NOPW %CS:(%RAX,%RAX,1) |
(4314) 0x4ddd80 VMOVUPD (%RAX,%R12,8),%YMM1 |
(4314) 0x4ddd86 KXNORW %K0,%K0,%K1 |
(4314) 0x4ddd8a VXORPD %XMM2,%XMM2,%XMM2 |
(4314) 0x4ddd8e VGATHERQPD (%RCX,%YMM1,8),%YMM2{%K1} |
(4314) 0x4ddd95 VFMADD231PD (%R13,%R12,8),%YMM2,%YMM0 |
(4314) 0x4ddd9c ADD $0x4,%R12 |
(4314) 0x4ddda0 CMP %R15,%R12 |
(4314) 0x4ddda3 JBE 4ddd80 |
(4312) 0x4ddda5 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(4312) 0x4dddab VADDPD %XMM1,%XMM0,%XMM0 |
(4312) 0x4dddaf VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(4312) 0x4dddb4 VADDSD %XMM1,%XMM0,%XMM0 |
(4312) 0x4dddb8 CMP %R9,%R11 |
(4312) 0x4dddbb MOV -0x38(%RBP),%R12 |
(4312) 0x4dddbf MOV %RBX,%R15 |
(4312) 0x4dddc2 MOV -0x30(%RBP),%RBX |
(4312) 0x4dddc6 JE 4ddd20 |
(4312) 0x4dddcc JMP 4dddd1 |
(4312) 0x4dddce XOR %R9D,%R9D |
(4312) 0x4dddd1 ADD %R10,%R9 |
(4312) 0x4dddd4 NOPW %CS:(%RAX,%RAX,1) |
(4313) 0x4ddde0 MOV (%RDX,%R9,8),%RAX |
(4313) 0x4ddde4 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4313) 0x4ddde9 VFMADD231SD (%R14,%R9,8),%XMM1,%XMM0 |
(4313) 0x4dddef INC %R9 |
(4313) 0x4dddf2 CMP %R9,%R8 |
(4313) 0x4dddf5 JNE 4ddde0 |
(4312) 0x4dddf7 JMP 4ddd20 |
0x4dddfc VUCOMISD 0x2160c(%RIP),%XMM5 |
0x4dde04 MOV %R15,%RSI |
0x4dde07 JNE 4de01c |
0x4dde0d VUCOMISD 0x2073b(%RIP),%XMM0 |
0x4dde15 JNE 4de13c |
0x4dde1b CMP %RSI,%R12 |
0x4dde1e MOV 0x28(%RBP),%R15 |
0x4dde22 JGE 4de95c |
0x4dde28 MOV %R12,%RAX |
0x4dde2b NOT %RAX |
0x4dde2e ADD %RAX,%RSI |
0x4dde31 XOR %EDI,%EDI |
0x4dde33 VMOVDDUP 0x21385(%RIP),%XMM0 |
0x4dde3b JMP 4dde5a |
0x4dde3d NOPL (%RAX) |
(4303) 0x4dde40 MOV 0x30(%RBP),%RAX |
(4303) 0x4dde44 VMOVSD %XMM1,(%RAX,%R8,8) |
(4303) 0x4dde4a LEA 0x1(%RDI),%RAX |
(4303) 0x4dde4e CMP %RSI,%RDI |
(4303) 0x4dde51 MOV %RAX,%RDI |
(4303) 0x4dde54 JE 4de95c |
(4303) 0x4dde5a LEA (%R12,%RDI,1),%R8 |
(4303) 0x4dde5e VMOVSD (%R15,%R8,8),%XMM1 |
(4303) 0x4dde64 VXORPD %XMM0,%XMM1,%XMM1 |
(4303) 0x4dde68 MOV (%RBX,%R8,8),%R11 |
(4303) 0x4dde6c MOV 0x8(%RBX,%R8,8),%R9 |
(4303) 0x4dde71 MOV %R9,%R13 |
(4303) 0x4dde74 SUB %R11,%R13 |
(4303) 0x4dde77 JLE 4dde40 |
(4303) 0x4dde79 MOV %R13,%R10 |
(4303) 0x4dde7c AND $-0x4,%R10 |
(4303) 0x4dde80 JE 4ddef5 |
(4303) 0x4dde82 MOV %RSI,%RBX |
(4303) 0x4dde85 LEA -0x1(%R10),%R15 |
(4303) 0x4dde89 LEA (%R14,%R11,8),%RSI |
(4303) 0x4dde8d LEA (%RDX,%R11,8),%RAX |
(4303) 0x4dde91 VXORPD %XMM2,%XMM2,%XMM2 |
(4303) 0x4dde95 XOR %R12D,%R12D |
(4303) 0x4dde98 NOPL (%RAX,%RAX,1) |
(4305) 0x4ddea0 VMOVUPD (%RAX,%R12,8),%YMM3 |
(4305) 0x4ddea6 KXNORW %K0,%K0,%K1 |
(4305) 0x4ddeaa VXORPD %XMM4,%XMM4,%XMM4 |
(4305) 0x4ddeae VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4305) 0x4ddeb5 VFMADD231PD (%RSI,%R12,8),%YMM4,%YMM2 |
(4305) 0x4ddebb ADD $0x4,%R12 |
(4305) 0x4ddebf CMP %R15,%R12 |
(4305) 0x4ddec2 JBE 4ddea0 |
(4303) 0x4ddec4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4303) 0x4ddeca VADDPD %XMM3,%XMM2,%XMM2 |
(4303) 0x4ddece VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4303) 0x4dded3 VADDSD %XMM3,%XMM2,%XMM2 |
(4303) 0x4dded7 VADDSD %XMM2,%XMM1,%XMM1 |
(4303) 0x4ddedb CMP %R10,%R13 |
(4303) 0x4ddede MOV -0x38(%RBP),%R12 |
(4303) 0x4ddee2 MOV %RBX,%RSI |
(4303) 0x4ddee5 MOV -0x30(%RBP),%RBX |
(4303) 0x4ddee9 MOV 0x28(%RBP),%R15 |
(4303) 0x4ddeed JE 4dde40 |
(4303) 0x4ddef3 JMP 4ddef8 |
(4303) 0x4ddef5 XOR %R10D,%R10D |
(4303) 0x4ddef8 ADD %R11,%R10 |
(4303) 0x4ddefb NOPL (%RAX,%RAX,1) |
(4304) 0x4ddf00 MOV (%RDX,%R10,8),%RAX |
(4304) 0x4ddf04 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4304) 0x4ddf09 VFMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4304) 0x4ddf0f INC %R10 |
(4304) 0x4ddf12 CMP %R10,%R9 |
(4304) 0x4ddf15 JNE 4ddf00 |
(4303) 0x4ddf17 JMP 4dde40 |
0x4ddf1c VUCOMISD 0x214ec(%RIP),%XMM0 |
0x4ddf24 JNE 4de24c |
0x4ddf2a CMP %R15,%R12 |
0x4ddf2d JGE 4de95c |
0x4ddf33 MOV %R12,%RAX |
0x4ddf36 NOT %RAX |
0x4ddf39 ADD %RAX,%R15 |
0x4ddf3c XOR %ESI,%ESI |
0x4ddf3e JMP 4ddf59 |
(4309) 0x4ddf40 MOV 0x30(%RBP),%RAX |
(4309) 0x4ddf44 VMOVSD %XMM0,(%RAX,%RDI,8) |
(4309) 0x4ddf49 LEA 0x1(%RSI),%RAX |
(4309) 0x4ddf4d CMP %R15,%RSI |
(4309) 0x4ddf50 MOV %RAX,%RSI |
(4309) 0x4ddf53 JE 4de95c |
(4309) 0x4ddf59 LEA (%R12,%RSI,1),%RDI |
(4309) 0x4ddf5d MOV (%RBX,%RDI,8),%R10 |
(4309) 0x4ddf61 MOV 0x8(%RBX,%RDI,8),%R8 |
(4309) 0x4ddf66 VXORPD %XMM0,%XMM0,%XMM0 |
(4309) 0x4ddf6a MOV %R8,%R11 |
(4309) 0x4ddf6d SUB %R10,%R11 |
(4309) 0x4ddf70 JLE 4ddf40 |
(4309) 0x4ddf72 MOV %R11,%R9 |
(4309) 0x4ddf75 AND $-0x4,%R9 |
(4309) 0x4ddf79 JE 4ddfee |
(4309) 0x4ddf7b MOV %R15,%RBX |
(4309) 0x4ddf7e LEA -0x1(%R9),%R15 |
(4309) 0x4ddf82 LEA (%R14,%R10,8),%R13 |
(4309) 0x4ddf86 LEA (%RDX,%R10,8),%RAX |
(4309) 0x4ddf8a VXORPD %XMM0,%XMM0,%XMM0 |
(4309) 0x4ddf8e XOR %R12D,%R12D |
(4309) 0x4ddf91 NOPW %CS:(%RAX,%RAX,1) |
(4311) 0x4ddfa0 VMOVUPD (%RAX,%R12,8),%YMM1 |
(4311) 0x4ddfa6 VXORPD %XMM2,%XMM2,%XMM2 |
(4311) 0x4ddfaa KXNORW %K0,%K0,%K1 |
(4311) 0x4ddfae VGATHERQPD (%RCX,%YMM1,8),%YMM2{%K1} |
(4311) 0x4ddfb5 VFNMADD231PD (%R13,%R12,8),%YMM2,%YMM0 |
(4311) 0x4ddfbc ADD $0x4,%R12 |
(4311) 0x4ddfc0 CMP %R15,%R12 |
(4311) 0x4ddfc3 JBE 4ddfa0 |
(4309) 0x4ddfc5 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(4309) 0x4ddfcb VADDPD %XMM1,%XMM0,%XMM0 |
(4309) 0x4ddfcf VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(4309) 0x4ddfd4 VADDSD %XMM1,%XMM0,%XMM0 |
(4309) 0x4ddfd8 CMP %R9,%R11 |
(4309) 0x4ddfdb MOV -0x38(%RBP),%R12 |
(4309) 0x4ddfdf MOV %RBX,%R15 |
(4309) 0x4ddfe2 MOV -0x30(%RBP),%RBX |
(4309) 0x4ddfe6 JE 4ddf40 |
(4309) 0x4ddfec JMP 4ddff1 |
(4309) 0x4ddfee XOR %R9D,%R9D |
(4309) 0x4ddff1 ADD %R10,%R9 |
(4309) 0x4ddff4 NOPW %CS:(%RAX,%RAX,1) |
(4310) 0x4de000 MOV (%RDX,%R9,8),%RAX |
(4310) 0x4de004 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4310) 0x4de009 VFNMADD231SD (%R14,%R9,8),%XMM1,%XMM0 |
(4310) 0x4de00f INC %R9 |
(4310) 0x4de012 CMP %R9,%R8 |
(4310) 0x4de015 JNE 4de000 |
(4309) 0x4de017 JMP 4ddf40 |
0x4de01c VUCOMISD 0x2052c(%RIP),%XMM5 |
0x4de024 JNE 4de34c |
0x4de02a VUCOMISD 0x2051e(%RIP),%XMM0 |
0x4de032 JNE 4de45c |
0x4de038 CMP %RSI,%R12 |
0x4de03b MOV 0x28(%RBP),%R15 |
0x4de03f JGE 4de95c |
0x4de045 MOV %R12,%RAX |
0x4de048 NOT %RAX |
0x4de04b ADD %RAX,%RSI |
0x4de04e XOR %EDI,%EDI |
0x4de050 MOV %RSI,-0x30(%RBP) |
0x4de054 JMP 4de07a |
0x4de056 NOPW %CS:(%RAX,%RAX,1) |
(4294) 0x4de060 MOV 0x30(%RBP),%RAX |
(4294) 0x4de064 VMOVSD %XMM0,(%RAX,%R8,8) |
(4294) 0x4de06a LEA 0x1(%RDI),%RAX |
(4294) 0x4de06e CMP %RSI,%RDI |
(4294) 0x4de071 MOV %RAX,%RDI |
(4294) 0x4de074 JE 4de95c |
(4294) 0x4de07a LEA (%R12,%RDI,1),%R8 |
(4294) 0x4de07e VMOVSD (%R15,%R8,8),%XMM0 |
(4294) 0x4de084 MOV (%RBX,%R8,8),%R11 |
(4294) 0x4de088 MOV 0x8(%RBX,%R8,8),%R9 |
(4294) 0x4de08d MOV %R9,%R13 |
(4294) 0x4de090 SUB %R11,%R13 |
(4294) 0x4de093 JLE 4de060 |
(4294) 0x4de095 MOV %R13,%R10 |
(4294) 0x4de098 AND $-0x4,%R10 |
(4294) 0x4de09c JE 4de112 |
(4294) 0x4de09e LEA -0x1(%R10),%R15 |
(4294) 0x4de0a2 LEA (%R14,%R11,8),%RSI |
(4294) 0x4de0a6 LEA (%RDX,%R11,8),%RAX |
(4294) 0x4de0aa VXORPD %XMM1,%XMM1,%XMM1 |
(4294) 0x4de0ae XOR %R12D,%R12D |
(4294) 0x4de0b1 NOPW %CS:(%RAX,%RAX,1) |
(4296) 0x4de0c0 VMOVUPD (%RAX,%R12,8),%YMM2 |
(4296) 0x4de0c6 VXORPD %XMM3,%XMM3,%XMM3 |
(4296) 0x4de0ca KXNORW %K0,%K0,%K1 |
(4296) 0x4de0ce VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(4296) 0x4de0d5 VFMADD231PD (%RSI,%R12,8),%YMM3,%YMM1 |
(4296) 0x4de0db ADD $0x4,%R12 |
(4296) 0x4de0df CMP %R15,%R12 |
(4296) 0x4de0e2 JBE 4de0c0 |
(4294) 0x4de0e4 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4294) 0x4de0ea VADDPD %XMM2,%XMM1,%XMM1 |
(4294) 0x4de0ee VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4294) 0x4de0f3 VADDSD %XMM2,%XMM1,%XMM1 |
(4294) 0x4de0f7 VADDSD %XMM1,%XMM0,%XMM0 |
(4294) 0x4de0fb CMP %R10,%R13 |
(4294) 0x4de0fe MOV -0x38(%RBP),%R12 |
(4294) 0x4de102 MOV -0x30(%RBP),%RSI |
(4294) 0x4de106 MOV 0x28(%RBP),%R15 |
(4294) 0x4de10a JE 4de060 |
(4294) 0x4de110 JMP 4de115 |
(4294) 0x4de112 XOR %R10D,%R10D |
(4294) 0x4de115 ADD %R11,%R10 |
(4294) 0x4de118 NOPL (%RAX,%RAX,1) |
(4295) 0x4de120 MOV (%RDX,%R10,8),%RAX |
(4295) 0x4de124 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4295) 0x4de129 VFMADD231SD (%R14,%R10,8),%XMM1,%XMM0 |
(4295) 0x4de12f INC %R10 |
(4295) 0x4de132 CMP %R10,%R9 |
(4295) 0x4de135 JNE 4de120 |
(4294) 0x4de137 JMP 4de060 |
0x4de13c VUCOMISD 0x212cc(%RIP),%XMM0 |
0x4de144 MOV 0x28(%RBP),%R15 |
0x4de148 JNE 4de56c |
0x4de14e CMP %RSI,%R12 |
0x4de151 JGE 4de95c |
0x4de157 MOV %R12,%RAX |
0x4de15a NOT %RAX |
0x4de15d ADD %RAX,%RSI |
0x4de160 XOR %EDI,%EDI |
0x4de162 MOV %RSI,-0x30(%RBP) |
0x4de166 JMP 4de18a |
0x4de168 NOPL (%RAX,%RAX,1) |
(4300) 0x4de170 MOV 0x30(%RBP),%RAX |
(4300) 0x4de174 VMOVSD %XMM0,(%RAX,%R8,8) |
(4300) 0x4de17a LEA 0x1(%RDI),%RAX |
(4300) 0x4de17e CMP %RSI,%RDI |
(4300) 0x4de181 MOV %RAX,%RDI |
(4300) 0x4de184 JE 4de95c |
(4300) 0x4de18a LEA (%R12,%RDI,1),%R8 |
(4300) 0x4de18e VMOVSD (%R15,%R8,8),%XMM0 |
(4300) 0x4de194 MOV (%RBX,%R8,8),%R11 |
(4300) 0x4de198 MOV 0x8(%RBX,%R8,8),%R9 |
(4300) 0x4de19d MOV %R9,%R13 |
(4300) 0x4de1a0 SUB %R11,%R13 |
(4300) 0x4de1a3 JLE 4de170 |
(4300) 0x4de1a5 MOV %R13,%R10 |
(4300) 0x4de1a8 AND $-0x4,%R10 |
(4300) 0x4de1ac JE 4de222 |
(4300) 0x4de1ae LEA -0x1(%R10),%R15 |
(4300) 0x4de1b2 LEA (%R14,%R11,8),%RSI |
(4300) 0x4de1b6 LEA (%RDX,%R11,8),%RAX |
(4300) 0x4de1ba VXORPD %XMM1,%XMM1,%XMM1 |
(4300) 0x4de1be XOR %R12D,%R12D |
(4300) 0x4de1c1 NOPW %CS:(%RAX,%RAX,1) |
(4302) 0x4de1d0 VMOVUPD (%RAX,%R12,8),%YMM2 |
(4302) 0x4de1d6 KXNORW %K0,%K0,%K1 |
(4302) 0x4de1da VXORPD %XMM3,%XMM3,%XMM3 |
(4302) 0x4de1de VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(4302) 0x4de1e5 VFNMADD231PD (%RSI,%R12,8),%YMM3,%YMM1 |
(4302) 0x4de1eb ADD $0x4,%R12 |
(4302) 0x4de1ef CMP %R15,%R12 |
(4302) 0x4de1f2 JBE 4de1d0 |
(4300) 0x4de1f4 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4300) 0x4de1fa VADDPD %XMM2,%XMM1,%XMM1 |
(4300) 0x4de1fe VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4300) 0x4de203 VADDSD %XMM2,%XMM1,%XMM1 |
(4300) 0x4de207 VADDSD %XMM1,%XMM0,%XMM0 |
(4300) 0x4de20b CMP %R10,%R13 |
(4300) 0x4de20e MOV -0x38(%RBP),%R12 |
(4300) 0x4de212 MOV -0x30(%RBP),%RSI |
(4300) 0x4de216 MOV 0x28(%RBP),%R15 |
(4300) 0x4de21a JE 4de170 |
(4300) 0x4de220 JMP 4de225 |
(4300) 0x4de222 XOR %R10D,%R10D |
(4300) 0x4de225 ADD %R11,%R10 |
(4300) 0x4de228 NOPL (%RAX,%RAX,1) |
(4301) 0x4de230 MOV (%RDX,%R10,8),%RAX |
(4301) 0x4de234 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4301) 0x4de239 VFNMADD231SD (%R14,%R10,8),%XMM1,%XMM0 |
(4301) 0x4de23f INC %R10 |
(4301) 0x4de242 CMP %R10,%R9 |
(4301) 0x4de245 JNE 4de230 |
(4300) 0x4de247 JMP 4de170 |
0x4de24c CMP %R15,%R12 |
0x4de24f JGE 4de95c |
0x4de255 MOV %R12,%RAX |
0x4de258 NOT %RAX |
0x4de25b ADD %RAX,%R15 |
0x4de25e XOR %ESI,%ESI |
0x4de260 JMP 4de28d |
0x4de262 NOPW %CS:(%RAX,%RAX,1) |
(4306) 0x4de270 VMULSD %XMM0,%XMM1,%XMM1 |
(4306) 0x4de274 MOV 0x30(%RBP),%RAX |
(4306) 0x4de278 VMOVSD %XMM1,(%RAX,%RDI,8) |
(4306) 0x4de27d LEA 0x1(%RSI),%RAX |
(4306) 0x4de281 CMP %R15,%RSI |
(4306) 0x4de284 MOV %RAX,%RSI |
(4306) 0x4de287 JE 4de95c |
(4306) 0x4de28d LEA (%R12,%RSI,1),%RDI |
(4306) 0x4de291 MOV (%RBX,%RDI,8),%R10 |
(4306) 0x4de295 MOV 0x8(%RBX,%RDI,8),%R8 |
(4306) 0x4de29a VXORPD %XMM1,%XMM1,%XMM1 |
(4306) 0x4de29e MOV %R8,%R11 |
(4306) 0x4de2a1 SUB %R10,%R11 |
(4306) 0x4de2a4 JLE 4de270 |
(4306) 0x4de2a6 MOV %R11,%R9 |
(4306) 0x4de2a9 AND $-0x4,%R9 |
(4306) 0x4de2ad JE 4de31e |
(4306) 0x4de2af MOV %R15,%RBX |
(4306) 0x4de2b2 LEA -0x1(%R9),%R15 |
(4306) 0x4de2b6 LEA (%R14,%R10,8),%R13 |
(4306) 0x4de2ba LEA (%RDX,%R10,8),%RAX |
(4306) 0x4de2be VXORPD %XMM1,%XMM1,%XMM1 |
(4306) 0x4de2c2 XOR %R12D,%R12D |
(4306) 0x4de2c5 NOPW %CS:(%RAX,%RAX,1) |
(4308) 0x4de2d0 VMOVUPD (%RAX,%R12,8),%YMM2 |
(4308) 0x4de2d6 VXORPD %XMM3,%XMM3,%XMM3 |
(4308) 0x4de2da KXNORW %K0,%K0,%K1 |
(4308) 0x4de2de VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(4308) 0x4de2e5 VFMADD231PD (%R13,%R12,8),%YMM3,%YMM1 |
(4308) 0x4de2ec ADD $0x4,%R12 |
(4308) 0x4de2f0 CMP %R15,%R12 |
(4308) 0x4de2f3 JBE 4de2d0 |
(4306) 0x4de2f5 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4306) 0x4de2fb VADDPD %XMM2,%XMM1,%XMM1 |
(4306) 0x4de2ff VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4306) 0x4de304 VADDSD %XMM2,%XMM1,%XMM1 |
(4306) 0x4de308 CMP %R9,%R11 |
(4306) 0x4de30b MOV -0x38(%RBP),%R12 |
(4306) 0x4de30f MOV %RBX,%R15 |
(4306) 0x4de312 MOV -0x30(%RBP),%RBX |
(4306) 0x4de316 JE 4de270 |
(4306) 0x4de31c JMP 4de321 |
(4306) 0x4de31e XOR %R9D,%R9D |
(4306) 0x4de321 ADD %R10,%R9 |
(4306) 0x4de324 NOPW %CS:(%RAX,%RAX,1) |
(4307) 0x4de330 MOV (%RDX,%R9,8),%RAX |
(4307) 0x4de334 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4307) 0x4de339 VFMADD231SD (%R14,%R9,8),%XMM2,%XMM1 |
(4307) 0x4de33f INC %R9 |
(4307) 0x4de342 CMP %R9,%R8 |
(4307) 0x4de345 JNE 4de330 |
(4306) 0x4de347 JMP 4de270 |
0x4de34c VUCOMISD 0x201fc(%RIP),%XMM0 |
0x4de354 JNE 4de66c |
0x4de35a CMP %RSI,%R12 |
0x4de35d MOV 0x28(%RBP),%R15 |
0x4de361 JGE 4de95c |
0x4de367 MOV %R12,%RAX |
0x4de36a NOT %RAX |
0x4de36d ADD %RAX,%RSI |
0x4de370 XOR %EDI,%EDI |
0x4de372 MOV %RSI,-0x30(%RBP) |
0x4de376 JMP 4de39a |
0x4de378 NOPL (%RAX,%RAX,1) |
(4285) 0x4de380 MOV 0x30(%RBP),%RAX |
(4285) 0x4de384 VMOVSD %XMM0,(%RAX,%R8,8) |
(4285) 0x4de38a LEA 0x1(%RDI),%RAX |
(4285) 0x4de38e CMP %RSI,%RDI |
(4285) 0x4de391 MOV %RAX,%RDI |
(4285) 0x4de394 JE 4de95c |
(4285) 0x4de39a LEA (%R12,%RDI,1),%R8 |
(4285) 0x4de39e VMULSD (%R15,%R8,8),%XMM5,%XMM0 |
(4285) 0x4de3a4 MOV (%RBX,%R8,8),%R11 |
(4285) 0x4de3a8 MOV 0x8(%RBX,%R8,8),%R9 |
(4285) 0x4de3ad MOV %R9,%R13 |
(4285) 0x4de3b0 SUB %R11,%R13 |
(4285) 0x4de3b3 JLE 4de380 |
(4285) 0x4de3b5 MOV %R13,%R10 |
(4285) 0x4de3b8 AND $-0x4,%R10 |
(4285) 0x4de3bc JE 4de432 |
(4285) 0x4de3be LEA -0x1(%R10),%R15 |
(4285) 0x4de3c2 LEA (%R14,%R11,8),%RSI |
(4285) 0x4de3c6 LEA (%RDX,%R11,8),%RAX |
(4285) 0x4de3ca VXORPD %XMM1,%XMM1,%XMM1 |
(4285) 0x4de3ce XOR %R12D,%R12D |
(4285) 0x4de3d1 NOPW %CS:(%RAX,%RAX,1) |
(4287) 0x4de3e0 VMOVUPD (%RAX,%R12,8),%YMM2 |
(4287) 0x4de3e6 KXNORW %K0,%K0,%K1 |
(4287) 0x4de3ea VXORPD %XMM3,%XMM3,%XMM3 |
(4287) 0x4de3ee VGATHERQPD (%RCX,%YMM2,8),%YMM3{%K1} |
(4287) 0x4de3f5 VFMADD231PD (%RSI,%R12,8),%YMM3,%YMM1 |
(4287) 0x4de3fb ADD $0x4,%R12 |
(4287) 0x4de3ff CMP %R15,%R12 |
(4287) 0x4de402 JBE 4de3e0 |
(4285) 0x4de404 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4285) 0x4de40a VADDPD %XMM2,%XMM1,%XMM1 |
(4285) 0x4de40e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4285) 0x4de413 VADDSD %XMM2,%XMM1,%XMM1 |
(4285) 0x4de417 VADDSD %XMM1,%XMM0,%XMM0 |
(4285) 0x4de41b CMP %R10,%R13 |
(4285) 0x4de41e MOV -0x38(%RBP),%R12 |
(4285) 0x4de422 MOV -0x30(%RBP),%RSI |
(4285) 0x4de426 MOV 0x28(%RBP),%R15 |
(4285) 0x4de42a JE 4de380 |
(4285) 0x4de430 JMP 4de435 |
(4285) 0x4de432 XOR %R10D,%R10D |
(4285) 0x4de435 ADD %R11,%R10 |
(4285) 0x4de438 NOPL (%RAX,%RAX,1) |
(4286) 0x4de440 MOV (%RDX,%R10,8),%RAX |
(4286) 0x4de444 VMOVSD (%RCX,%RAX,8),%XMM1 |
(4286) 0x4de449 VFMADD231SD (%R14,%R10,8),%XMM1,%XMM0 |
(4286) 0x4de44f INC %R10 |
(4286) 0x4de452 CMP %R10,%R9 |
(4286) 0x4de455 JNE 4de440 |
(4285) 0x4de457 JMP 4de380 |
0x4de45c VUCOMISD 0x20fac(%RIP),%XMM0 |
0x4de464 MOV 0x28(%RBP),%R15 |
0x4de468 JNE 4de77c |
0x4de46e CMP %RSI,%R12 |
0x4de471 JGE 4de95c |
0x4de477 MOV %R12,%RAX |
0x4de47a NOT %RAX |
0x4de47d ADD %RAX,%RSI |
0x4de480 XOR %EDI,%EDI |
0x4de482 VMOVDDUP 0x20d36(%RIP),%XMM0 |
0x4de48a MOV %RSI,-0x30(%RBP) |
0x4de48e JMP 4de4aa |
(4291) 0x4de490 MOV 0x30(%RBP),%RAX |
(4291) 0x4de494 VMOVSD %XMM1,(%RAX,%R8,8) |
(4291) 0x4de49a LEA 0x1(%RDI),%RAX |
(4291) 0x4de49e CMP %RSI,%RDI |
(4291) 0x4de4a1 MOV %RAX,%RDI |
(4291) 0x4de4a4 JE 4de95c |
(4291) 0x4de4aa LEA (%R12,%RDI,1),%R8 |
(4291) 0x4de4ae VMOVSD (%R15,%R8,8),%XMM1 |
(4291) 0x4de4b4 VXORPD %XMM0,%XMM1,%XMM1 |
(4291) 0x4de4b8 MOV (%RBX,%R8,8),%R11 |
(4291) 0x4de4bc MOV 0x8(%RBX,%R8,8),%R9 |
(4291) 0x4de4c1 MOV %R9,%R13 |
(4291) 0x4de4c4 SUB %R11,%R13 |
(4291) 0x4de4c7 JLE 4de490 |
(4291) 0x4de4c9 MOV %R13,%R10 |
(4291) 0x4de4cc AND $-0x4,%R10 |
(4291) 0x4de4d0 JE 4de542 |
(4291) 0x4de4d2 LEA -0x1(%R10),%R15 |
(4291) 0x4de4d6 LEA (%R14,%R11,8),%RSI |
(4291) 0x4de4da LEA (%RDX,%R11,8),%RAX |
(4291) 0x4de4de VXORPD %XMM2,%XMM2,%XMM2 |
(4291) 0x4de4e2 XOR %R12D,%R12D |
(4291) 0x4de4e5 NOPW %CS:(%RAX,%RAX,1) |
(4293) 0x4de4f0 VMOVUPD (%RAX,%R12,8),%YMM3 |
(4293) 0x4de4f6 VXORPD %XMM4,%XMM4,%XMM4 |
(4293) 0x4de4fa KXNORW %K0,%K0,%K1 |
(4293) 0x4de4fe VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4293) 0x4de505 VFNMADD231PD (%RSI,%R12,8),%YMM4,%YMM2 |
(4293) 0x4de50b ADD $0x4,%R12 |
(4293) 0x4de50f CMP %R15,%R12 |
(4293) 0x4de512 JBE 4de4f0 |
(4291) 0x4de514 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4291) 0x4de51a VADDPD %XMM3,%XMM2,%XMM2 |
(4291) 0x4de51e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4291) 0x4de523 VADDSD %XMM3,%XMM2,%XMM2 |
(4291) 0x4de527 VADDSD %XMM2,%XMM1,%XMM1 |
(4291) 0x4de52b CMP %R10,%R13 |
(4291) 0x4de52e MOV -0x38(%RBP),%R12 |
(4291) 0x4de532 MOV -0x30(%RBP),%RSI |
(4291) 0x4de536 MOV 0x28(%RBP),%R15 |
(4291) 0x4de53a JE 4de490 |
(4291) 0x4de540 JMP 4de545 |
(4291) 0x4de542 XOR %R10D,%R10D |
(4291) 0x4de545 ADD %R11,%R10 |
(4291) 0x4de548 NOPL (%RAX,%RAX,1) |
(4292) 0x4de550 MOV (%RDX,%R10,8),%RAX |
(4292) 0x4de554 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4292) 0x4de559 VFNMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4292) 0x4de55f INC %R10 |
(4292) 0x4de562 CMP %R10,%R9 |
(4292) 0x4de565 JNE 4de550 |
(4291) 0x4de567 JMP 4de490 |
0x4de56c CMP %RSI,%R12 |
0x4de56f JGE 4de95c |
0x4de575 MOV %R12,%RAX |
0x4de578 NOT %RAX |
0x4de57b ADD %RAX,%RSI |
0x4de57e XOR %EDI,%EDI |
0x4de580 VMOVDDUP 0x20c38(%RIP),%XMM1 |
0x4de588 MOV %RSI,-0x30(%RBP) |
0x4de58c JMP 4de5ae |
0x4de58e XCHG %AX,%AX |
(4297) 0x4de590 VMULSD %XMM0,%XMM2,%XMM2 |
(4297) 0x4de594 MOV 0x30(%RBP),%RAX |
(4297) 0x4de598 VMOVSD %XMM2,(%RAX,%R8,8) |
(4297) 0x4de59e LEA 0x1(%RDI),%RAX |
(4297) 0x4de5a2 CMP %RSI,%RDI |
(4297) 0x4de5a5 MOV %RAX,%RDI |
(4297) 0x4de5a8 JE 4de95c |
(4297) 0x4de5ae LEA (%R12,%RDI,1),%R8 |
(4297) 0x4de5b2 VMOVSD (%R15,%R8,8),%XMM2 |
(4297) 0x4de5b8 VXORPD %XMM1,%XMM2,%XMM2 |
(4297) 0x4de5bc MOV (%RBX,%R8,8),%R11 |
(4297) 0x4de5c0 MOV 0x8(%RBX,%R8,8),%R9 |
(4297) 0x4de5c5 MOV %R9,%R13 |
(4297) 0x4de5c8 SUB %R11,%R13 |
(4297) 0x4de5cb JLE 4de590 |
(4297) 0x4de5cd MOV %R13,%R10 |
(4297) 0x4de5d0 AND $-0x4,%R10 |
(4297) 0x4de5d4 JE 4de642 |
(4297) 0x4de5d6 LEA -0x1(%R10),%R15 |
(4297) 0x4de5da LEA (%R14,%R11,8),%RSI |
(4297) 0x4de5de LEA (%RDX,%R11,8),%RAX |
(4297) 0x4de5e2 VXORPD %XMM3,%XMM3,%XMM3 |
(4297) 0x4de5e6 XOR %R12D,%R12D |
(4297) 0x4de5e9 NOPL (%RAX) |
(4299) 0x4de5f0 VMOVUPD (%RAX,%R12,8),%YMM4 |
(4299) 0x4de5f6 VXORPD %XMM5,%XMM5,%XMM5 |
(4299) 0x4de5fa KXNORW %K0,%K0,%K1 |
(4299) 0x4de5fe VGATHERQPD (%RCX,%YMM4,8),%YMM5{%K1} |
(4299) 0x4de605 VFMADD231PD (%RSI,%R12,8),%YMM5,%YMM3 |
(4299) 0x4de60b ADD $0x4,%R12 |
(4299) 0x4de60f CMP %R15,%R12 |
(4299) 0x4de612 JBE 4de5f0 |
(4297) 0x4de614 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(4297) 0x4de61a VADDPD %XMM4,%XMM3,%XMM3 |
(4297) 0x4de61e VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(4297) 0x4de623 VADDSD %XMM4,%XMM3,%XMM3 |
(4297) 0x4de627 VADDSD %XMM3,%XMM2,%XMM2 |
(4297) 0x4de62b CMP %R10,%R13 |
(4297) 0x4de62e MOV -0x38(%RBP),%R12 |
(4297) 0x4de632 MOV -0x30(%RBP),%RSI |
(4297) 0x4de636 MOV 0x28(%RBP),%R15 |
(4297) 0x4de63a JE 4de590 |
(4297) 0x4de640 JMP 4de645 |
(4297) 0x4de642 XOR %R10D,%R10D |
(4297) 0x4de645 ADD %R11,%R10 |
(4297) 0x4de648 NOPL (%RAX,%RAX,1) |
(4298) 0x4de650 MOV (%RDX,%R10,8),%RAX |
(4298) 0x4de654 VMOVSD (%RCX,%RAX,8),%XMM3 |
(4298) 0x4de659 VFMADD231SD (%R14,%R10,8),%XMM3,%XMM2 |
(4298) 0x4de65f INC %R10 |
(4298) 0x4de662 CMP %R10,%R9 |
(4298) 0x4de665 JNE 4de650 |
(4297) 0x4de667 JMP 4de590 |
0x4de66c VUCOMISD 0x20d9c(%RIP),%XMM0 |
0x4de674 MOV 0x28(%RBP),%R11 |
0x4de678 JNE 4de86c |
0x4de67e CMP %RSI,%R12 |
0x4de681 JGE 4de95c |
0x4de687 VXORPD 0x20b2f(%RIP){1to2},%XMM5,%XMM0 |
0x4de691 MOV %R12,%RAX |
0x4de694 NOT %RAX |
0x4de697 ADD %RAX,%RSI |
0x4de69a XOR %EDI,%EDI |
0x4de69c JMP 4de6b8 |
(4282) 0x4de69e MOV 0x30(%RBP),%RAX |
(4282) 0x4de6a2 VMOVSD %XMM1,(%RAX,%R8,8) |
(4282) 0x4de6a8 LEA 0x1(%RDI),%RAX |
(4282) 0x4de6ac CMP %RSI,%RDI |
(4282) 0x4de6af MOV %RAX,%RDI |
(4282) 0x4de6b2 JE 4de95c |
(4282) 0x4de6b8 LEA (%R12,%RDI,1),%R8 |
(4282) 0x4de6bc VMULSD (%R11,%R8,8),%XMM0,%XMM1 |
(4282) 0x4de6c2 MOV (%RBX,%R8,8),%RAX |
(4282) 0x4de6c6 MOV 0x8(%RBX,%R8,8),%R9 |
(4282) 0x4de6cb MOV %R9,%R13 |
(4282) 0x4de6ce SUB %RAX,%R13 |
(4282) 0x4de6d1 JLE 4de69e |
(4282) 0x4de6d3 MOV %R13,%R10 |
(4282) 0x4de6d6 AND $-0x4,%R10 |
(4282) 0x4de6da JE 4de755 |
(4282) 0x4de6dc MOV %RSI,%RBX |
(4282) 0x4de6df LEA -0x1(%R10),%R15 |
(4282) 0x4de6e3 LEA (%R14,%RAX,8),%RSI |
(4282) 0x4de6e7 MOV %RAX,-0x38(%RBP) |
(4282) 0x4de6eb LEA (%RDX,%RAX,8),%RAX |
(4282) 0x4de6ef VXORPD %XMM2,%XMM2,%XMM2 |
(4282) 0x4de6f3 XOR %R11D,%R11D |
(4282) 0x4de6f6 NOPW %CS:(%RAX,%RAX,1) |
(4284) 0x4de700 VMOVUPD (%RAX,%R11,8),%YMM3 |
(4284) 0x4de706 VXORPD %XMM4,%XMM4,%XMM4 |
(4284) 0x4de70a KXNORW %K0,%K0,%K1 |
(4284) 0x4de70e VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4284) 0x4de715 VFNMADD231PD (%RSI,%R11,8),%YMM4,%YMM2 |
(4284) 0x4de71b ADD $0x4,%R11 |
(4284) 0x4de71f CMP %R15,%R11 |
(4284) 0x4de722 JBE 4de700 |
(4282) 0x4de724 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4282) 0x4de72a VADDPD %XMM3,%XMM2,%XMM2 |
(4282) 0x4de72e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4282) 0x4de733 VADDSD %XMM3,%XMM2,%XMM2 |
(4282) 0x4de737 VADDSD %XMM2,%XMM1,%XMM1 |
(4282) 0x4de73b CMP %R10,%R13 |
(4282) 0x4de73e MOV %RBX,%RSI |
(4282) 0x4de741 MOV -0x30(%RBP),%RBX |
(4282) 0x4de745 MOV 0x28(%RBP),%R11 |
(4282) 0x4de749 MOV -0x38(%RBP),%RAX |
(4282) 0x4de74d JE 4de69e |
(4282) 0x4de753 JMP 4de758 |
(4282) 0x4de755 XOR %R10D,%R10D |
(4282) 0x4de758 ADD %RAX,%R10 |
(4282) 0x4de75b NOPL (%RAX,%RAX,1) |
(4283) 0x4de760 MOV (%RDX,%R10,8),%RAX |
(4283) 0x4de764 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4283) 0x4de769 VFNMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4283) 0x4de76f INC %R10 |
(4283) 0x4de772 CMP %R10,%R9 |
(4283) 0x4de775 JNE 4de760 |
(4282) 0x4de777 JMP 4de69e |
0x4de77c CMP %RSI,%R12 |
0x4de77f JGE 4de95c |
0x4de785 MOV %R12,%RAX |
0x4de788 NOT %RAX |
0x4de78b ADD %RAX,%RSI |
0x4de78e XOR %EDI,%EDI |
0x4de790 MOV %RSI,-0x30(%RBP) |
0x4de794 JMP 4de7b4 |
(4288) 0x4de796 VMULSD %XMM0,%XMM1,%XMM1 |
(4288) 0x4de79a MOV 0x30(%RBP),%RAX |
(4288) 0x4de79e VMOVSD %XMM1,(%RAX,%R8,8) |
(4288) 0x4de7a4 LEA 0x1(%RDI),%RAX |
(4288) 0x4de7a8 CMP %RSI,%RDI |
(4288) 0x4de7ab MOV %RAX,%RDI |
(4288) 0x4de7ae JE 4de95c |
(4288) 0x4de7b4 LEA (%R12,%RDI,1),%R8 |
(4288) 0x4de7b8 VMOVSD (%R15,%R8,8),%XMM1 |
(4288) 0x4de7be MOV (%RBX,%R8,8),%R11 |
(4288) 0x4de7c2 MOV 0x8(%RBX,%R8,8),%R9 |
(4288) 0x4de7c7 MOV %R9,%R13 |
(4288) 0x4de7ca SUB %R11,%R13 |
(4288) 0x4de7cd JLE 4de796 |
(4288) 0x4de7cf MOV %R13,%R10 |
(4288) 0x4de7d2 AND $-0x4,%R10 |
(4288) 0x4de7d6 JE 4de842 |
(4288) 0x4de7d8 LEA -0x1(%R10),%R15 |
(4288) 0x4de7dc LEA (%R14,%R11,8),%RSI |
(4288) 0x4de7e0 LEA (%RDX,%R11,8),%RAX |
(4288) 0x4de7e4 VXORPD %XMM2,%XMM2,%XMM2 |
(4288) 0x4de7e8 XOR %R12D,%R12D |
(4288) 0x4de7eb NOPL (%RAX,%RAX,1) |
(4290) 0x4de7f0 VMOVUPD (%RAX,%R12,8),%YMM3 |
(4290) 0x4de7f6 KXNORW %K0,%K0,%K1 |
(4290) 0x4de7fa VXORPD %XMM4,%XMM4,%XMM4 |
(4290) 0x4de7fe VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4290) 0x4de805 VFMADD231PD (%RSI,%R12,8),%YMM4,%YMM2 |
(4290) 0x4de80b ADD $0x4,%R12 |
(4290) 0x4de80f CMP %R15,%R12 |
(4290) 0x4de812 JBE 4de7f0 |
(4288) 0x4de814 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4288) 0x4de81a VADDPD %XMM3,%XMM2,%XMM2 |
(4288) 0x4de81e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4288) 0x4de823 VADDSD %XMM3,%XMM2,%XMM2 |
(4288) 0x4de827 VADDSD %XMM2,%XMM1,%XMM1 |
(4288) 0x4de82b CMP %R10,%R13 |
(4288) 0x4de82e MOV -0x38(%RBP),%R12 |
(4288) 0x4de832 MOV -0x30(%RBP),%RSI |
(4288) 0x4de836 MOV 0x28(%RBP),%R15 |
(4288) 0x4de83a JE 4de796 |
(4288) 0x4de840 JMP 4de845 |
(4288) 0x4de842 XOR %R10D,%R10D |
(4288) 0x4de845 ADD %R11,%R10 |
(4288) 0x4de848 NOPL (%RAX,%RAX,1) |
(4289) 0x4de850 MOV (%RDX,%R10,8),%RAX |
(4289) 0x4de854 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4289) 0x4de859 VFMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4289) 0x4de85f INC %R10 |
(4289) 0x4de862 CMP %R10,%R9 |
(4289) 0x4de865 JNE 4de850 |
(4288) 0x4de867 JMP 4de796 |
0x4de86c CMP %RSI,%R12 |
0x4de86f JGE 4de95c |
0x4de875 MOV %R12,%RAX |
0x4de878 NOT %RAX |
0x4de87b ADD %RAX,%RSI |
0x4de87e XOR %EDI,%EDI |
0x4de880 JMP 4de8a0 |
(4279) 0x4de882 VMULSD %XMM0,%XMM1,%XMM1 |
(4279) 0x4de886 MOV 0x30(%RBP),%RAX |
(4279) 0x4de88a VMOVSD %XMM1,(%RAX,%R8,8) |
(4279) 0x4de890 LEA 0x1(%RDI),%RAX |
(4279) 0x4de894 CMP %RSI,%RDI |
(4279) 0x4de897 MOV %RAX,%RDI |
(4279) 0x4de89a JE 4de95c |
(4279) 0x4de8a0 LEA (%R12,%RDI,1),%R8 |
(4279) 0x4de8a4 VMULSD (%R11,%R8,8),%XMM5,%XMM1 |
(4279) 0x4de8aa MOV (%RBX,%R8,8),%RAX |
(4279) 0x4de8ae MOV 0x8(%RBX,%R8,8),%R9 |
(4279) 0x4de8b3 MOV %R9,%R13 |
(4279) 0x4de8b6 SUB %RAX,%R13 |
(4279) 0x4de8b9 JLE 4de882 |
(4279) 0x4de8bb MOV %R13,%R10 |
(4279) 0x4de8be AND $-0x4,%R10 |
(4279) 0x4de8c2 JE 4de935 |
(4279) 0x4de8c4 MOV %RSI,%RBX |
(4279) 0x4de8c7 LEA -0x1(%R10),%R15 |
(4279) 0x4de8cb LEA (%R14,%RAX,8),%RSI |
(4279) 0x4de8cf MOV %RAX,-0x38(%RBP) |
(4279) 0x4de8d3 LEA (%RDX,%RAX,8),%R11 |
(4279) 0x4de8d7 VXORPD %XMM2,%XMM2,%XMM2 |
(4279) 0x4de8db XOR %EAX,%EAX |
(4279) 0x4de8dd NOPL (%RAX) |
(4281) 0x4de8e0 VMOVUPD (%R11,%RAX,8),%YMM3 |
(4281) 0x4de8e6 VXORPD %XMM4,%XMM4,%XMM4 |
(4281) 0x4de8ea KXNORW %K0,%K0,%K1 |
(4281) 0x4de8ee VGATHERQPD (%RCX,%YMM3,8),%YMM4{%K1} |
(4281) 0x4de8f5 VFMADD231PD (%RSI,%RAX,8),%YMM4,%YMM2 |
(4281) 0x4de8fb ADD $0x4,%RAX |
(4281) 0x4de8ff CMP %R15,%RAX |
(4281) 0x4de902 JBE 4de8e0 |
(4279) 0x4de904 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4279) 0x4de90a VADDPD %XMM3,%XMM2,%XMM2 |
(4279) 0x4de90e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4279) 0x4de913 VADDSD %XMM3,%XMM2,%XMM2 |
(4279) 0x4de917 VADDSD %XMM2,%XMM1,%XMM1 |
(4279) 0x4de91b CMP %R10,%R13 |
(4279) 0x4de91e MOV %RBX,%RSI |
(4279) 0x4de921 MOV -0x30(%RBP),%RBX |
(4279) 0x4de925 MOV 0x28(%RBP),%R11 |
(4279) 0x4de929 MOV -0x38(%RBP),%RAX |
(4279) 0x4de92d JE 4de882 |
(4279) 0x4de933 JMP 4de938 |
(4279) 0x4de935 XOR %R10D,%R10D |
(4279) 0x4de938 ADD %RAX,%R10 |
(4279) 0x4de93b NOPL (%RAX,%RAX,1) |
(4280) 0x4de940 MOV (%RDX,%R10,8),%RAX |
(4280) 0x4de944 VMOVSD (%RCX,%RAX,8),%XMM2 |
(4280) 0x4de949 VFMADD231SD (%R14,%R10,8),%XMM2,%XMM1 |
(4280) 0x4de94f INC %R10 |
(4280) 0x4de952 CMP %R10,%R9 |
(4280) 0x4de955 JNE 4de940 |
(4279) 0x4de957 JMP 4de882 |
0x4de95c ADD $0x18,%RSP |
0x4de960 POP %RBX |
0x4de961 POP %R12 |
0x4de963 POP %R13 |
0x4de965 POP %R14 |
0x4de967 POP %R15 |
0x4de969 POP %RBP |
0x4de96a VZEROUPPER |
0x4de96d RET |
0x4de96e XCHG %AX,%AX |
Path / |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 207 |
nb uops | 226 |
loop length | 822 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 7 |
micro-operation queue | 37.67 cycles |
front end | 37.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 19.07 | 12.00 | 12.00 | 11.50 | 18.93 | 20.00 | 11.50 | 11.50 | 11.50 | 19.00 | 12.00 |
cycles | 20.00 | 19.07 | 12.00 | 12.00 | 11.50 | 18.93 | 20.00 | 11.50 | 11.50 | 11.50 | 19.00 | 12.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 36.27 |
Stall cycles | 0.00 |
Front-end | 37.67 |
Dispatch | 20.00 |
Overall L1 | 37.67 |
all | 1% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 1% |
all | 10% |
load | 5% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 3% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 10% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4dc680 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4dc700 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ddc57 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x67> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x259f90(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x510a05,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x512a2b,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e7000 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x5133d1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e9720 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4ddc65 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ddc93 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x259f54(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x510a05,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x513458,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e7000 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x5133d1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e9720 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4ddca2 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ddcd5 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x259f17(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x510a05,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x51347a,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e7000 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x5133d1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e9720 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD -0x38(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4dddfc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x20c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x20850(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4ddf1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x32c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ddd39 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x149> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x2160c(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R15,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JNE 4de01c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x42c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x2073b(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de13c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x54c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x21385(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4dde5a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x26a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x214ec(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de24c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x65c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ddf59 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x369> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VUCOMISD 0x2052c(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de34c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x2051e(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de45c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x86c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de07a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x48a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x212cc(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4de56c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x97c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de18a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x59a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4de28d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x69d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x201fc(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de66c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de39a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7aa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x20fac(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4de77c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb8c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x20d36(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de4aa <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8ba> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x20c38(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de5ae <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x9be> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x20d9c(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4de86c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x20b2f(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4de6b8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xac8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de7b4 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbc4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4de8a0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcb0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 207 |
nb uops | 226 |
loop length | 822 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 7 |
micro-operation queue | 37.67 cycles |
front end | 37.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 19.07 | 12.00 | 12.00 | 11.50 | 18.93 | 20.00 | 11.50 | 11.50 | 11.50 | 19.00 | 12.00 |
cycles | 20.00 | 19.07 | 12.00 | 12.00 | 11.50 | 18.93 | 20.00 | 11.50 | 11.50 | 11.50 | 19.00 | 12.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 36.27 |
Stall cycles | 0.00 |
Front-end | 37.67 |
Dispatch | 20.00 |
Overall L1 | 37.67 |
all | 1% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 1% |
all | 10% |
load | 5% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 3% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 10% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4dc680 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %R12,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4dc700 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RAX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ddc57 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x67> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x259f90(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x510a05,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x512a2b,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e7000 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x5133d1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e9720 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4ddc65 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ddc93 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x259f54(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x510a05,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x513458,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e7000 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x5133d1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e9720 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4ddca2 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R13,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4ddcd5 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x259f17(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x510a05,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x51347a,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e7000 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x5133d1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4e9720 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD -0x38(%RBP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4dddfc <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x20c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x20850(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4ddf1c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x32c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ddd39 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x149> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x2160c(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV %R15,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JNE 4de01c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x42c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x2073b(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de13c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x54c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x21385(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4dde5a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x26a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x214ec(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de24c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x65c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4ddf59 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x369> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
VUCOMISD 0x2052c(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de34c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x2051e(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de45c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x86c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de07a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x48a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x212cc(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4de56c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x97c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de18a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x59a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4de28d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x69d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x201fc(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4de66c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de39a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7aa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x20fac(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4de77c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb8c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x20d36(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de4aa <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8ba> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x20c38(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de5ae <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x9be> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x20d9c(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
MOV 0x28(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4de86c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x20b2f(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4de6b8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xac8> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4de7b4 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbc4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %RSI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4de95c <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd6c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R12,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4de8a0 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcb0> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x18,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace.extracted– | 16.57 | 3.59 |
▼Loop 4294 - csr_matvec.c:248-341 - exec– | 0.94 | 0.18 |
○Loop 4295 - csr_matvec.c:337-339 - exec | 0.46 | 0.09 |
○Loop 4296 - csr_matvec.c:337-339 - exec | 0.12 | 0.02 |
▼Loop 4300 - csr_matvec.c:248-314 - exec– | 0.41 | 0.08 |
○Loop 4302 - csr_matvec.c:310-312 - exec | 6.58 | 1.29 |
○Loop 4301 - csr_matvec.c:310-312 - exec | 0.95 | 0.19 |
▼Loop 4312 - csr_matvec.c:248-263 - exec– | 0.32 | 0.06 |
○Loop 4314 - csr_matvec.c:259-261 - exec | 5.98 | 1.17 |
○Loop 4313 - csr_matvec.c:259-261 - exec | 0.82 | 0.16 |
▼Loop 4291 - csr_matvec.c:248-353 - exec– | 0 | 0 |
○Loop 4292 - csr_matvec.c:349-351 - exec | 0 | 0 |
○Loop 4293 - csr_matvec.c:349-351 - exec | 0 | 0 |
▼Loop 4279 - csr_matvec.c:248-404 - exec– | 0 | 0 |
○Loop 4280 - csr_matvec.c:400-402 - exec | 0 | 0 |
○Loop 4281 - csr_matvec.c:400-402 - exec | 0 | 0 |
▼Loop 4297 - csr_matvec.c:248-326 - exec– | 0 | 0 |
○Loop 4298 - csr_matvec.c:322-324 - exec | 0 | 0 |
○Loop 4299 - csr_matvec.c:322-324 - exec | 0 | 0 |
▼Loop 4282 - csr_matvec.c:248-392 - exec– | 0 | 0 |
○Loop 4284 - csr_matvec.c:388-390 - exec | 0 | 0 |
○Loop 4283 - csr_matvec.c:388-390 - exec | 0 | 0 |
▼Loop 4306 - csr_matvec.c:248-287 - exec– | 0 | 0 |
○Loop 4308 - csr_matvec.c:283-285 - exec | 0 | 0 |
○Loop 4307 - csr_matvec.c:283-285 - exec | 0 | 0 |
▼Loop 4285 - csr_matvec.c:248-380 - exec– | 0 | 0 |
○Loop 4286 - csr_matvec.c:376-378 - exec | 0 | 0 |
○Loop 4287 - csr_matvec.c:376-378 - exec | 0 | 0 |
▼Loop 4309 - csr_matvec.c:248-275 - exec– | 0 | 0 |
○Loop 4310 - csr_matvec.c:271-273 - exec | 0 | 0 |
○Loop 4311 - csr_matvec.c:271-273 - exec | 0 | 0 |
▼Loop 4303 - csr_matvec.c:248-302 - exec– | 0 | 0 |
○Loop 4305 - csr_matvec.c:298-300 - exec | 0 | 0 |
○Loop 4304 - csr_matvec.c:298-300 - exec | 0 | 0 |
▼Loop 4288 - csr_matvec.c:248-365 - exec– | 0 | 0 |
○Loop 4290 - csr_matvec.c:361-363 - exec | 0 | 0 |
○Loop 4289 - csr_matvec.c:361-363 - exec | 0 | 0 |