Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 11.2% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 11.2% |
---|
/scratch_na/users/xoserete/qaas_runs/171-172-8217/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 243 - 404 |
-------------------------------------------------------------------------------- |
243: #pragma omp parallel private(i,jj,tempx) |
244: #endif |
245: { |
246: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
247: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
248: hypre_assert(iBegin <= iEnd); |
249: hypre_assert(iBegin >= 0 && iBegin <= num_rows); |
250: hypre_assert(iEnd >= 0 && iEnd <= num_rows); |
251: |
252: if (0 == temp) |
253: { |
254: if (1 == alpha) // JSP: a common path |
255: { |
256: for (i = iBegin; i < iEnd; i++) |
257: { |
258: tempx = 0.0; |
259: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
260: { |
261: tempx += A_data[jj] * x_data[A_j[jj]]; |
262: } |
263: y_data[i] = tempx; |
264: } |
265: } // y = A*x |
266: else if (-1 == alpha) |
267: { |
268: for (i = iBegin; i < iEnd; i++) |
269: { |
270: tempx = 0.0; |
271: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
272: { |
273: tempx -= A_data[jj] * x_data[A_j[jj]]; |
274: } |
275: y_data[i] = tempx; |
276: } |
277: } // y = -A*x |
278: else |
279: { |
280: for (i = iBegin; i < iEnd; i++) |
281: { |
282: tempx = 0.0; |
283: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
284: { |
285: tempx += A_data[jj] * x_data[A_j[jj]]; |
286: } |
287: y_data[i] = alpha*tempx; |
288: } |
289: } // y = alpha*A*x |
290: } // temp == 0 |
291: else if (-1 == temp) // beta == -alpha |
292: { |
293: if (1 == alpha) // JSP: a common path |
294: { |
295: for (i = iBegin; i < iEnd; i++) |
296: { |
297: tempx = -b_data[i]; |
298: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
299: { |
300: tempx += A_data[jj] * x_data[A_j[jj]]; |
301: } |
302: y_data[i] = tempx; |
303: } |
304: } // y = A*x - b |
305: else if (-1 == alpha) // JSP: a common path |
306: { |
307: for (i = iBegin; i < iEnd; i++) |
308: { |
309: tempx = b_data[i]; |
310: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
311: { |
312: tempx -= A_data[jj] * x_data[A_j[jj]]; |
313: } |
314: y_data[i] = tempx; |
315: } |
316: } // y = -A*x + b |
317: else |
318: { |
319: for (i = iBegin; i < iEnd; i++) |
320: { |
321: tempx = -b_data[i]; |
322: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
323: { |
324: tempx += A_data[jj] * x_data[A_j[jj]]; |
325: } |
326: y_data[i] = alpha*tempx; |
327: } |
328: } // y = alpha*(A*x - b) |
329: } // temp == -1 |
330: else if (1 == temp) |
331: { |
332: if (1 == alpha) // JSP: a common path |
333: { |
334: for (i = iBegin; i < iEnd; i++) |
335: { |
336: tempx = b_data[i]; |
337: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
338: { |
339: tempx += A_data[jj] * x_data[A_j[jj]]; |
340: } |
341: y_data[i] = tempx; |
342: } |
343: } // y = A*x + b |
344: else if (-1 == alpha) |
345: { |
346: for (i = iBegin; i < iEnd; i++) |
347: { |
348: tempx = -b_data[i]; |
349: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
350: { |
351: tempx -= A_data[jj] * x_data[A_j[jj]]; |
352: } |
353: y_data[i] = tempx; |
354: } |
355: } // y = -A*x - b |
356: else |
357: { |
358: for (i = iBegin; i < iEnd; i++) |
359: { |
360: tempx = b_data[i]; |
361: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
362: { |
363: tempx += A_data[jj] * x_data[A_j[jj]]; |
364: } |
365: y_data[i] = alpha*tempx; |
[...] |
371: if (1 == alpha) // JSP: a common path |
372: { |
373: for (i = iBegin; i < iEnd; i++) |
374: { |
375: tempx = b_data[i]*temp; |
376: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
377: { |
378: tempx += A_data[jj] * x_data[A_j[jj]]; |
379: } |
380: y_data[i] = tempx; |
381: } |
382: } // y = A*x + temp*b |
383: else if (-1 == alpha) |
384: { |
385: for (i = iBegin; i < iEnd; i++) |
386: { |
387: tempx = -b_data[i]*temp; |
388: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
389: { |
390: tempx -= A_data[jj] * x_data[A_j[jj]]; |
391: } |
392: y_data[i] = tempx; |
393: } |
394: } // y = -A*x - temp*b |
395: else |
396: { |
397: for (i = iBegin; i < iEnd; i++) |
398: { |
399: tempx = b_data[i]*temp; |
400: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
401: { |
402: tempx += A_data[jj] * x_data[A_j[jj]]; |
403: } |
404: y_data[i] = alpha*tempx; |
0x4cd350 PUSH %RBP |
0x4cd351 MOV %RSP,%RBP |
0x4cd354 PUSH %R15 |
0x4cd356 PUSH %R14 |
0x4cd358 PUSH %R13 |
0x4cd35a PUSH %R12 |
0x4cd35c PUSH %RBX |
0x4cd35d SUB $0x28,%RSP |
0x4cd361 MOV %R9,%R12 |
0x4cd364 MOV %R8,-0x48(%RBP) |
0x4cd368 MOV %RCX,%R15 |
0x4cd36b MOV %RDX,%R13 |
0x4cd36e MOV %RCX,%RDI |
0x4cd371 CALL 4cbd60 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> |
0x4cd376 MOV %RAX,%R14 |
0x4cd379 MOV %R15,%RDI |
0x4cd37c CALL 4cbde0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> |
0x4cd381 MOV %RAX,%R15 |
0x4cd384 CMP %RAX,%R14 |
0x4cd387 JLE 4cd3b7 |
0x4cd389 MOV 0x24d870(%RIP),%RDI |
0x4cd390 MOV $0x4f4525,%ESI |
0x4cd395 MOV $0x4f653b,%EDX |
0x4cd39a XOR %EAX,%EAX |
0x4cd39c CALL 4d58d0 <hypre_fprintf> |
0x4cd3a1 MOV $0x4f6ee1,%EDI |
0x4cd3a6 MOV $0xf8,%ESI |
0x4cd3ab MOV $0x1,%EDX |
0x4cd3b0 XOR %ECX,%ECX |
0x4cd3b2 CALL 4d8210 <hypre_error_handler> |
0x4cd3b7 MOV 0x18(%RBP),%RBX |
0x4cd3bb TEST %R14,%R14 |
0x4cd3be JS 4cd3c5 |
0x4cd3c0 CMP %RBX,%R14 |
0x4cd3c3 JLE 4cd3f3 |
0x4cd3c5 MOV 0x24d834(%RIP),%RDI |
0x4cd3cc MOV $0x4f4525,%ESI |
0x4cd3d1 MOV $0x4f6f68,%EDX |
0x4cd3d6 XOR %EAX,%EAX |
0x4cd3d8 CALL 4d58d0 <hypre_fprintf> |
0x4cd3dd MOV $0x4f6ee1,%EDI |
0x4cd3e2 MOV $0xf9,%ESI |
0x4cd3e7 MOV $0x1,%EDX |
0x4cd3ec XOR %ECX,%ECX |
0x4cd3ee CALL 4d8210 <hypre_error_handler> |
0x4cd3f3 VMOVSD 0x38(%RBP),%XMM5 |
0x4cd3f8 TEST %R15,%R15 |
0x4cd3fb JS 4cd402 |
0x4cd3fd CMP %RBX,%R15 |
0x4cd400 JLE 4cd435 |
0x4cd402 MOV 0x24d7f7(%RIP),%RDI |
0x4cd409 MOV $0x4f4525,%ESI |
0x4cd40e MOV $0x4f6f8a,%EDX |
0x4cd413 XOR %EAX,%EAX |
0x4cd415 CALL 4d58d0 <hypre_fprintf> |
0x4cd41a MOV $0x4f6ee1,%EDI |
0x4cd41f MOV $0xfa,%ESI |
0x4cd424 MOV $0x1,%EDX |
0x4cd429 XOR %ECX,%ECX |
0x4cd42b CALL 4d8210 <hypre_error_handler> |
0x4cd430 VMOVSD 0x38(%RBP),%XMM5 |
0x4cd435 MOV 0x30(%RBP),%RSI |
0x4cd439 VMOVQ %R13,%XMM0 |
0x4cd43e VXORPD %XMM1,%XMM1,%XMM1 |
0x4cd442 VUCOMISD %XMM1,%XMM5 |
0x4cd446 MOV %R14,-0x40(%RBP) |
0x4cd44a JNE 4cd56d |
0x4cd450 VUCOMISD 0x14bd8(%RIP),%XMM0 |
0x4cd458 JNE 4cd6ae |
0x4cd45e CMP %R15,%R14 |
0x4cd461 JGE 4ce20e |
0x4cd467 MOV (%R12),%RDX |
0x4cd46b MOV (%RSI),%RBX |
0x4cd46e MOV %R14,%RAX |
0x4cd471 NOT %RAX |
0x4cd474 ADD %RAX,%R15 |
0x4cd477 XOR %EDI,%EDI |
0x4cd479 MOV %R15,-0x38(%RBP) |
0x4cd47d MOV %RBX,-0x30(%RBP) |
0x4cd481 JMP 4cd4a6 |
0x4cd483 NOPW %CS:(%RAX,%RAX,1) |
(4060) 0x4cd490 VMOVSD %XMM0,(%RBX,%R8,8) |
(4060) 0x4cd496 LEA 0x1(%RDI),%RAX |
(4060) 0x4cd49a CMP %R15,%RDI |
(4060) 0x4cd49d MOV %RAX,%RDI |
(4060) 0x4cd4a0 JE 4ce20e |
(4060) 0x4cd4a6 LEA (%R14,%RDI,1),%R8 |
(4060) 0x4cd4aa MOV (%RDX,%R8,8),%RAX |
(4060) 0x4cd4ae MOV 0x8(%RDX,%R8,8),%R9 |
(4060) 0x4cd4b3 VXORPD %XMM0,%XMM0,%XMM0 |
(4060) 0x4cd4b7 MOV %R9,%RCX |
(4060) 0x4cd4ba SUB %RAX,%RCX |
(4060) 0x4cd4bd JLE 4cd490 |
(4060) 0x4cd4bf MOV -0x48(%RBP),%RSI |
(4060) 0x4cd4c3 MOV (%RSI),%R10 |
(4060) 0x4cd4c6 MOV 0x20(%RBP),%RSI |
(4060) 0x4cd4ca MOV (%RSI),%R11 |
(4060) 0x4cd4cd MOV 0x10(%RBP),%RSI |
(4060) 0x4cd4d1 MOV (%RSI),%R12 |
(4060) 0x4cd4d4 MOV %RCX,%R13 |
(4060) 0x4cd4d7 AND $-0x4,%R13 |
(4060) 0x4cd4db JE 4cd53e |
(4060) 0x4cd4dd LEA -0x1(%R13),%RBX |
(4060) 0x4cd4e1 LEA (%R10,%RAX,8),%R14 |
(4060) 0x4cd4e5 LEA (%R12,%RAX,8),%R15 |
(4060) 0x4cd4e9 VXORPD %XMM0,%XMM0,%XMM0 |
(4060) 0x4cd4ed XOR %ESI,%ESI |
(4060) 0x4cd4ef NOP |
(4062) 0x4cd4f0 VMOVUPD (%R15,%RSI,8),%YMM1 |
(4062) 0x4cd4f6 KXNORW %K0,%K0,%K1 |
(4062) 0x4cd4fa VXORPD %XMM2,%XMM2,%XMM2 |
(4062) 0x4cd4fe VGATHERQPD (%R11,%YMM1,8),%YMM2{%K1} |
(4062) 0x4cd505 VFMADD231PD (%R14,%RSI,8),%YMM2,%YMM0 |
(4062) 0x4cd50b ADD $0x4,%RSI |
(4062) 0x4cd50f CMP %RBX,%RSI |
(4062) 0x4cd512 JBE 4cd4f0 |
(4060) 0x4cd514 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(4060) 0x4cd51a VADDPD %XMM1,%XMM0,%XMM0 |
(4060) 0x4cd51e VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(4060) 0x4cd523 VADDSD %XMM1,%XMM0,%XMM0 |
(4060) 0x4cd527 CMP %R13,%RCX |
(4060) 0x4cd52a MOV -0x40(%RBP),%R14 |
(4060) 0x4cd52e MOV -0x38(%RBP),%R15 |
(4060) 0x4cd532 MOV -0x30(%RBP),%RBX |
(4060) 0x4cd536 JE 4cd490 |
(4060) 0x4cd53c JMP 4cd541 |
(4060) 0x4cd53e XOR %R13D,%R13D |
(4060) 0x4cd541 ADD %RAX,%R13 |
(4060) 0x4cd544 NOPW %CS:(%RAX,%RAX,1) |
(4061) 0x4cd550 MOV (%R12,%R13,8),%RAX |
(4061) 0x4cd554 VMOVSD (%R11,%RAX,8),%XMM1 |
(4061) 0x4cd55a VFMADD231SD (%R10,%R13,8),%XMM1,%XMM0 |
(4061) 0x4cd560 INC %R13 |
(4061) 0x4cd563 CMP %R13,%R9 |
(4061) 0x4cd566 JNE 4cd550 |
(4060) 0x4cd568 JMP 4cd490 |
0x4cd56d MOV 0x28(%RBP),%RBX |
0x4cd571 VUCOMISD 0x159b7(%RIP),%XMM5 |
0x4cd579 JNE 4cd7cd |
0x4cd57f VUCOMISD 0x14aa9(%RIP),%XMM0 |
0x4cd587 JNE 4cd8fe |
0x4cd58d CMP %R15,%R14 |
0x4cd590 JGE 4ce20e |
0x4cd596 MOV (%R12),%RDI |
0x4cd59a MOV (%RSI),%RSI |
0x4cd59d MOV %R14,%RAX |
0x4cd5a0 NOT %RAX |
0x4cd5a3 ADD %RAX,%R15 |
0x4cd5a6 XOR %R8D,%R8D |
0x4cd5a9 VMOVDDUP 0x1572f(%RIP),%XMM0 |
0x4cd5b1 MOV %R15,-0x38(%RBP) |
0x4cd5b5 MOV %RSI,-0x30(%RBP) |
0x4cd5b9 JMP 4cd5d6 |
0x4cd5bb NOPL (%RAX,%RAX,1) |
(4051) 0x4cd5c0 VMOVSD %XMM1,(%RSI,%R9,8) |
(4051) 0x4cd5c6 LEA 0x1(%R8),%RAX |
(4051) 0x4cd5ca CMP %R15,%R8 |
(4051) 0x4cd5cd MOV %RAX,%R8 |
(4051) 0x4cd5d0 JE 4ce20e |
(4051) 0x4cd5d6 LEA (%R14,%R8,1),%R9 |
(4051) 0x4cd5da VMOVSD (%RBX,%R9,8),%XMM1 |
(4051) 0x4cd5e0 VXORPD %XMM0,%XMM1,%XMM1 |
(4051) 0x4cd5e4 MOV (%RDI,%R9,8),%RAX |
(4051) 0x4cd5e8 MOV 0x8(%RDI,%R9,8),%R10 |
(4051) 0x4cd5ed MOV %R10,%RCX |
(4051) 0x4cd5f0 SUB %RAX,%RCX |
(4051) 0x4cd5f3 JLE 4cd5c0 |
(4051) 0x4cd5f5 MOV -0x48(%RBP),%RDX |
(4051) 0x4cd5f9 MOV (%RDX),%R11 |
(4051) 0x4cd5fc MOV 0x20(%RBP),%RDX |
(4051) 0x4cd600 MOV (%RDX),%R12 |
(4051) 0x4cd603 MOV 0x10(%RBP),%RDX |
(4051) 0x4cd607 MOV (%RDX),%R13 |
(4051) 0x4cd60a MOV %RCX,%RDX |
(4051) 0x4cd60d AND $-0x4,%RDX |
(4051) 0x4cd611 JE 4cd686 |
(4051) 0x4cd613 LEA -0x1(%RDX),%RBX |
(4051) 0x4cd617 LEA (%R11,%RAX,8),%R14 |
(4051) 0x4cd61b LEA (%R13,%RAX,8),%R15 |
(4051) 0x4cd620 VXORPD %XMM2,%XMM2,%XMM2 |
(4051) 0x4cd624 XOR %ESI,%ESI |
(4051) 0x4cd626 NOPW %CS:(%RAX,%RAX,1) |
(4053) 0x4cd630 VMOVUPD (%R15,%RSI,8),%YMM3 |
(4053) 0x4cd636 KXNORW %K0,%K0,%K1 |
(4053) 0x4cd63a VXORPD %XMM4,%XMM4,%XMM4 |
(4053) 0x4cd63e VGATHERQPD (%R12,%YMM3,8),%YMM4{%K1} |
(4053) 0x4cd645 VFMADD231PD (%R14,%RSI,8),%YMM4,%YMM2 |
(4053) 0x4cd64b ADD $0x4,%RSI |
(4053) 0x4cd64f CMP %RBX,%RSI |
(4053) 0x4cd652 JBE 4cd630 |
(4051) 0x4cd654 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4051) 0x4cd65a VADDPD %XMM3,%XMM2,%XMM2 |
(4051) 0x4cd65e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4051) 0x4cd663 VADDSD %XMM3,%XMM2,%XMM2 |
(4051) 0x4cd667 VADDSD %XMM2,%XMM1,%XMM1 |
(4051) 0x4cd66b CMP %RDX,%RCX |
(4051) 0x4cd66e MOV -0x40(%RBP),%R14 |
(4051) 0x4cd672 MOV -0x38(%RBP),%R15 |
(4051) 0x4cd676 MOV 0x28(%RBP),%RBX |
(4051) 0x4cd67a MOV -0x30(%RBP),%RSI |
(4051) 0x4cd67e JE 4cd5c0 |
(4051) 0x4cd684 JMP 4cd688 |
(4051) 0x4cd686 XOR %EDX,%EDX |
(4051) 0x4cd688 ADD %RAX,%RDX |
(4051) 0x4cd68b NOPL (%RAX,%RAX,1) |
(4052) 0x4cd690 MOV (%R13,%RDX,8),%RAX |
(4052) 0x4cd695 VMOVSD (%R12,%RAX,8),%XMM2 |
(4052) 0x4cd69b VFMADD231SD (%R11,%RDX,8),%XMM2,%XMM1 |
(4052) 0x4cd6a1 INC %RDX |
(4052) 0x4cd6a4 CMP %RDX,%R10 |
(4052) 0x4cd6a7 JNE 4cd690 |
(4051) 0x4cd6a9 JMP 4cd5c0 |
0x4cd6ae VUCOMISD 0x1587a(%RIP),%XMM0 |
0x4cd6b6 JNE 4cda2e |
0x4cd6bc CMP %R15,%R14 |
0x4cd6bf JGE 4ce20e |
0x4cd6c5 MOV (%R12),%RDX |
0x4cd6c9 MOV (%RSI),%RBX |
0x4cd6cc MOV %R14,%RAX |
0x4cd6cf NOT %RAX |
0x4cd6d2 ADD %RAX,%R15 |
0x4cd6d5 XOR %EDI,%EDI |
0x4cd6d7 MOV %R15,-0x38(%RBP) |
0x4cd6db MOV %RBX,-0x30(%RBP) |
0x4cd6df JMP 4cd706 |
0x4cd6e1 NOPW %CS:(%RAX,%RAX,1) |
(4057) 0x4cd6f0 VMOVSD %XMM0,(%RBX,%R8,8) |
(4057) 0x4cd6f6 LEA 0x1(%RDI),%RAX |
(4057) 0x4cd6fa CMP %R15,%RDI |
(4057) 0x4cd6fd MOV %RAX,%RDI |
(4057) 0x4cd700 JE 4ce20e |
(4057) 0x4cd706 LEA (%R14,%RDI,1),%R8 |
(4057) 0x4cd70a MOV (%RDX,%R8,8),%RAX |
(4057) 0x4cd70e MOV 0x8(%RDX,%R8,8),%R9 |
(4057) 0x4cd713 VXORPD %XMM0,%XMM0,%XMM0 |
(4057) 0x4cd717 MOV %R9,%RCX |
(4057) 0x4cd71a SUB %RAX,%RCX |
(4057) 0x4cd71d JLE 4cd6f0 |
(4057) 0x4cd71f MOV -0x48(%RBP),%RSI |
(4057) 0x4cd723 MOV (%RSI),%R10 |
(4057) 0x4cd726 MOV 0x20(%RBP),%RSI |
(4057) 0x4cd72a MOV (%RSI),%R11 |
(4057) 0x4cd72d MOV 0x10(%RBP),%RSI |
(4057) 0x4cd731 MOV (%RSI),%R12 |
(4057) 0x4cd734 MOV %RCX,%R13 |
(4057) 0x4cd737 AND $-0x4,%R13 |
(4057) 0x4cd73b JE 4cd79e |
(4057) 0x4cd73d LEA -0x1(%R13),%RBX |
(4057) 0x4cd741 LEA (%R10,%RAX,8),%R14 |
(4057) 0x4cd745 LEA (%R12,%RAX,8),%R15 |
(4057) 0x4cd749 VXORPD %XMM0,%XMM0,%XMM0 |
(4057) 0x4cd74d XOR %ESI,%ESI |
(4057) 0x4cd74f NOP |
(4059) 0x4cd750 VMOVUPD (%R15,%RSI,8),%YMM1 |
(4059) 0x4cd756 VXORPD %XMM2,%XMM2,%XMM2 |
(4059) 0x4cd75a KXNORW %K0,%K0,%K1 |
(4059) 0x4cd75e VGATHERQPD (%R11,%YMM1,8),%YMM2{%K1} |
(4059) 0x4cd765 VFNMADD231PD (%R14,%RSI,8),%YMM2,%YMM0 |
(4059) 0x4cd76b ADD $0x4,%RSI |
(4059) 0x4cd76f CMP %RBX,%RSI |
(4059) 0x4cd772 JBE 4cd750 |
(4057) 0x4cd774 VEXTRACTF128 $0x1,%YMM0,%XMM1 |
(4057) 0x4cd77a VADDPD %XMM1,%XMM0,%XMM0 |
(4057) 0x4cd77e VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(4057) 0x4cd783 VADDSD %XMM1,%XMM0,%XMM0 |
(4057) 0x4cd787 CMP %R13,%RCX |
(4057) 0x4cd78a MOV -0x40(%RBP),%R14 |
(4057) 0x4cd78e MOV -0x38(%RBP),%R15 |
(4057) 0x4cd792 MOV -0x30(%RBP),%RBX |
(4057) 0x4cd796 JE 4cd6f0 |
(4057) 0x4cd79c JMP 4cd7a1 |
(4057) 0x4cd79e XOR %R13D,%R13D |
(4057) 0x4cd7a1 ADD %RAX,%R13 |
(4057) 0x4cd7a4 NOPW %CS:(%RAX,%RAX,1) |
(4058) 0x4cd7b0 MOV (%R12,%R13,8),%RAX |
(4058) 0x4cd7b4 VMOVSD (%R11,%RAX,8),%XMM1 |
(4058) 0x4cd7ba VFNMADD231SD (%R10,%R13,8),%XMM1,%XMM0 |
(4058) 0x4cd7c0 INC %R13 |
(4058) 0x4cd7c3 CMP %R13,%R9 |
(4058) 0x4cd7c6 JNE 4cd7b0 |
(4057) 0x4cd7c8 JMP 4cd6f0 |
0x4cd7cd VUCOMISD 0x1485b(%RIP),%XMM5 |
0x4cd7d5 JNE 4cdb4d |
0x4cd7db VUCOMISD 0x1484d(%RIP),%XMM0 |
0x4cd7e3 JNE 4cdc7e |
0x4cd7e9 CMP %R15,%R14 |
0x4cd7ec JGE 4ce20e |
0x4cd7f2 MOV (%R12),%RDI |
0x4cd7f6 MOV (%RSI),%RSI |
0x4cd7f9 MOV %R14,%RAX |
0x4cd7fc NOT %RAX |
0x4cd7ff ADD %RAX,%R15 |
0x4cd802 XOR %R8D,%R8D |
0x4cd805 MOV %R15,-0x38(%RBP) |
0x4cd809 MOV %RSI,-0x30(%RBP) |
0x4cd80d JMP 4cd826 |
0x4cd80f NOP |
(4042) 0x4cd810 VMOVSD %XMM0,(%RSI,%R9,8) |
(4042) 0x4cd816 LEA 0x1(%R8),%RAX |
(4042) 0x4cd81a CMP %R15,%R8 |
(4042) 0x4cd81d MOV %RAX,%R8 |
(4042) 0x4cd820 JE 4ce20e |
(4042) 0x4cd826 LEA (%R14,%R8,1),%R9 |
(4042) 0x4cd82a VMOVSD (%RBX,%R9,8),%XMM0 |
(4042) 0x4cd830 MOV (%RDI,%R9,8),%RAX |
(4042) 0x4cd834 MOV 0x8(%RDI,%R9,8),%R10 |
(4042) 0x4cd839 MOV %R10,%RCX |
(4042) 0x4cd83c SUB %RAX,%RCX |
(4042) 0x4cd83f JLE 4cd810 |
(4042) 0x4cd841 MOV -0x48(%RBP),%RDX |
(4042) 0x4cd845 MOV (%RDX),%R11 |
(4042) 0x4cd848 MOV 0x20(%RBP),%RDX |
(4042) 0x4cd84c MOV (%RDX),%R12 |
(4042) 0x4cd84f MOV 0x10(%RBP),%RDX |
(4042) 0x4cd853 MOV (%RDX),%R13 |
(4042) 0x4cd856 MOV %RCX,%RDX |
(4042) 0x4cd859 AND $-0x4,%RDX |
(4042) 0x4cd85d JE 4cd8d6 |
(4042) 0x4cd85f LEA -0x1(%RDX),%RBX |
(4042) 0x4cd863 LEA (%R11,%RAX,8),%RSI |
(4042) 0x4cd867 LEA (%R13,%RAX,8),%R14 |
(4042) 0x4cd86c VXORPD %XMM1,%XMM1,%XMM1 |
(4042) 0x4cd870 XOR %R15D,%R15D |
(4042) 0x4cd873 NOPW %CS:(%RAX,%RAX,1) |
(4044) 0x4cd880 VMOVUPD (%R14,%R15,8),%YMM2 |
(4044) 0x4cd886 VXORPD %XMM3,%XMM3,%XMM3 |
(4044) 0x4cd88a KXNORW %K0,%K0,%K1 |
(4044) 0x4cd88e VGATHERQPD (%R12,%YMM2,8),%YMM3{%K1} |
(4044) 0x4cd895 VFMADD231PD (%RSI,%R15,8),%YMM3,%YMM1 |
(4044) 0x4cd89b ADD $0x4,%R15 |
(4044) 0x4cd89f CMP %RBX,%R15 |
(4044) 0x4cd8a2 JBE 4cd880 |
(4042) 0x4cd8a4 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4042) 0x4cd8aa VADDPD %XMM2,%XMM1,%XMM1 |
(4042) 0x4cd8ae VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4042) 0x4cd8b3 VADDSD %XMM2,%XMM1,%XMM1 |
(4042) 0x4cd8b7 VADDSD %XMM1,%XMM0,%XMM0 |
(4042) 0x4cd8bb CMP %RDX,%RCX |
(4042) 0x4cd8be MOV -0x40(%RBP),%R14 |
(4042) 0x4cd8c2 MOV -0x38(%RBP),%R15 |
(4042) 0x4cd8c6 MOV 0x28(%RBP),%RBX |
(4042) 0x4cd8ca MOV -0x30(%RBP),%RSI |
(4042) 0x4cd8ce JE 4cd810 |
(4042) 0x4cd8d4 JMP 4cd8d8 |
(4042) 0x4cd8d6 XOR %EDX,%EDX |
(4042) 0x4cd8d8 ADD %RAX,%RDX |
(4042) 0x4cd8db NOPL (%RAX,%RAX,1) |
(4043) 0x4cd8e0 MOV (%R13,%RDX,8),%RAX |
(4043) 0x4cd8e5 VMOVSD (%R12,%RAX,8),%XMM1 |
(4043) 0x4cd8eb VFMADD231SD (%R11,%RDX,8),%XMM1,%XMM0 |
(4043) 0x4cd8f1 INC %RDX |
(4043) 0x4cd8f4 CMP %RDX,%R10 |
(4043) 0x4cd8f7 JNE 4cd8e0 |
(4042) 0x4cd8f9 JMP 4cd810 |
0x4cd8fe VUCOMISD 0x1562a(%RIP),%XMM0 |
0x4cd906 JNE 4cddae |
0x4cd90c CMP %R15,%R14 |
0x4cd90f JGE 4ce20e |
0x4cd915 MOV (%R12),%RDI |
0x4cd919 MOV (%RSI),%RSI |
0x4cd91c MOV %R14,%RAX |
0x4cd91f NOT %RAX |
0x4cd922 ADD %RAX,%R15 |
0x4cd925 XOR %R8D,%R8D |
0x4cd928 MOV %R15,-0x38(%RBP) |
0x4cd92c MOV %RSI,-0x30(%RBP) |
0x4cd930 JMP 4cd956 |
0x4cd932 NOPW %CS:(%RAX,%RAX,1) |
(4048) 0x4cd940 VMOVSD %XMM0,(%RSI,%R9,8) |
(4048) 0x4cd946 LEA 0x1(%R8),%RAX |
(4048) 0x4cd94a CMP %R15,%R8 |
(4048) 0x4cd94d MOV %RAX,%R8 |
(4048) 0x4cd950 JE 4ce20e |
(4048) 0x4cd956 LEA (%R14,%R8,1),%R9 |
(4048) 0x4cd95a VMOVSD (%RBX,%R9,8),%XMM0 |
(4048) 0x4cd960 MOV (%RDI,%R9,8),%RAX |
(4048) 0x4cd964 MOV 0x8(%RDI,%R9,8),%R10 |
(4048) 0x4cd969 MOV %R10,%RCX |
(4048) 0x4cd96c SUB %RAX,%RCX |
(4048) 0x4cd96f JLE 4cd940 |
(4048) 0x4cd971 MOV -0x48(%RBP),%RDX |
(4048) 0x4cd975 MOV (%RDX),%R11 |
(4048) 0x4cd978 MOV 0x20(%RBP),%RDX |
(4048) 0x4cd97c MOV (%RDX),%R12 |
(4048) 0x4cd97f MOV 0x10(%RBP),%RDX |
(4048) 0x4cd983 MOV (%RDX),%R13 |
(4048) 0x4cd986 MOV %RCX,%RDX |
(4048) 0x4cd989 AND $-0x4,%RDX |
(4048) 0x4cd98d JE 4cda06 |
(4048) 0x4cd98f LEA -0x1(%RDX),%RBX |
(4048) 0x4cd993 LEA (%R11,%RAX,8),%RSI |
(4048) 0x4cd997 LEA (%R13,%RAX,8),%R14 |
(4048) 0x4cd99c VXORPD %XMM1,%XMM1,%XMM1 |
(4048) 0x4cd9a0 XOR %R15D,%R15D |
(4048) 0x4cd9a3 NOPW %CS:(%RAX,%RAX,1) |
(4050) 0x4cd9b0 VMOVUPD (%R14,%R15,8),%YMM2 |
(4050) 0x4cd9b6 KXNORW %K0,%K0,%K1 |
(4050) 0x4cd9ba VXORPD %XMM3,%XMM3,%XMM3 |
(4050) 0x4cd9be VGATHERQPD (%R12,%YMM2,8),%YMM3{%K1} |
(4050) 0x4cd9c5 VFNMADD231PD (%RSI,%R15,8),%YMM3,%YMM1 |
(4050) 0x4cd9cb ADD $0x4,%R15 |
(4050) 0x4cd9cf CMP %RBX,%R15 |
(4050) 0x4cd9d2 JBE 4cd9b0 |
(4048) 0x4cd9d4 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4048) 0x4cd9da VADDPD %XMM2,%XMM1,%XMM1 |
(4048) 0x4cd9de VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4048) 0x4cd9e3 VADDSD %XMM2,%XMM1,%XMM1 |
(4048) 0x4cd9e7 VADDSD %XMM1,%XMM0,%XMM0 |
(4048) 0x4cd9eb CMP %RDX,%RCX |
(4048) 0x4cd9ee MOV -0x40(%RBP),%R14 |
(4048) 0x4cd9f2 MOV -0x38(%RBP),%R15 |
(4048) 0x4cd9f6 MOV 0x28(%RBP),%RBX |
(4048) 0x4cd9fa MOV -0x30(%RBP),%RSI |
(4048) 0x4cd9fe JE 4cd940 |
(4048) 0x4cda04 JMP 4cda08 |
(4048) 0x4cda06 XOR %EDX,%EDX |
(4048) 0x4cda08 ADD %RAX,%RDX |
(4048) 0x4cda0b NOPL (%RAX,%RAX,1) |
(4049) 0x4cda10 MOV (%R13,%RDX,8),%RAX |
(4049) 0x4cda15 VMOVSD (%R12,%RAX,8),%XMM1 |
(4049) 0x4cda1b VFNMADD231SD (%R11,%RDX,8),%XMM1,%XMM0 |
(4049) 0x4cda21 INC %RDX |
(4049) 0x4cda24 CMP %RDX,%R10 |
(4049) 0x4cda27 JNE 4cda10 |
(4048) 0x4cda29 JMP 4cd940 |
0x4cda2e CMP %R15,%R14 |
0x4cda31 JGE 4ce20e |
0x4cda37 MOV (%R12),%RDX |
0x4cda3b MOV (%RSI),%RBX |
0x4cda3e MOV %R14,%RAX |
0x4cda41 NOT %RAX |
0x4cda44 ADD %RAX,%R15 |
0x4cda47 XOR %EDI,%EDI |
0x4cda49 MOV %R15,-0x38(%RBP) |
0x4cda4d MOV %RBX,-0x30(%RBP) |
0x4cda51 JMP 4cda7a |
0x4cda53 NOPW %CS:(%RAX,%RAX,1) |
(4054) 0x4cda60 VMULSD %XMM0,%XMM1,%XMM1 |
(4054) 0x4cda64 VMOVSD %XMM1,(%RBX,%R8,8) |
(4054) 0x4cda6a LEA 0x1(%RDI),%RAX |
(4054) 0x4cda6e CMP %R15,%RDI |
(4054) 0x4cda71 MOV %RAX,%RDI |
(4054) 0x4cda74 JE 4ce20e |
(4054) 0x4cda7a LEA (%R14,%RDI,1),%R8 |
(4054) 0x4cda7e MOV (%RDX,%R8,8),%RAX |
(4054) 0x4cda82 MOV 0x8(%RDX,%R8,8),%R9 |
(4054) 0x4cda87 VXORPD %XMM1,%XMM1,%XMM1 |
(4054) 0x4cda8b MOV %R9,%RCX |
(4054) 0x4cda8e SUB %RAX,%RCX |
(4054) 0x4cda91 JLE 4cda60 |
(4054) 0x4cda93 MOV -0x48(%RBP),%RSI |
(4054) 0x4cda97 MOV (%RSI),%R10 |
(4054) 0x4cda9a MOV 0x20(%RBP),%RSI |
(4054) 0x4cda9e MOV (%RSI),%R11 |
(4054) 0x4cdaa1 MOV 0x10(%RBP),%RSI |
(4054) 0x4cdaa5 MOV (%RSI),%R12 |
(4054) 0x4cdaa8 MOV %RCX,%R13 |
(4054) 0x4cdaab AND $-0x4,%R13 |
(4054) 0x4cdaaf JE 4cdb1e |
(4054) 0x4cdab1 LEA -0x1(%R13),%RBX |
(4054) 0x4cdab5 LEA (%R10,%RAX,8),%R14 |
(4054) 0x4cdab9 LEA (%R12,%RAX,8),%R15 |
(4054) 0x4cdabd VXORPD %XMM1,%XMM1,%XMM1 |
(4054) 0x4cdac1 XOR %ESI,%ESI |
(4054) 0x4cdac3 NOPW %CS:(%RAX,%RAX,1) |
(4056) 0x4cdad0 VMOVUPD (%R15,%RSI,8),%YMM2 |
(4056) 0x4cdad6 VXORPD %XMM3,%XMM3,%XMM3 |
(4056) 0x4cdada KXNORW %K0,%K0,%K1 |
(4056) 0x4cdade VGATHERQPD (%R11,%YMM2,8),%YMM3{%K1} |
(4056) 0x4cdae5 VFMADD231PD (%R14,%RSI,8),%YMM3,%YMM1 |
(4056) 0x4cdaeb ADD $0x4,%RSI |
(4056) 0x4cdaef CMP %RBX,%RSI |
(4056) 0x4cdaf2 JBE 4cdad0 |
(4054) 0x4cdaf4 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4054) 0x4cdafa VADDPD %XMM2,%XMM1,%XMM1 |
(4054) 0x4cdafe VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4054) 0x4cdb03 VADDSD %XMM2,%XMM1,%XMM1 |
(4054) 0x4cdb07 CMP %R13,%RCX |
(4054) 0x4cdb0a MOV -0x40(%RBP),%R14 |
(4054) 0x4cdb0e MOV -0x38(%RBP),%R15 |
(4054) 0x4cdb12 MOV -0x30(%RBP),%RBX |
(4054) 0x4cdb16 JE 4cda60 |
(4054) 0x4cdb1c JMP 4cdb21 |
(4054) 0x4cdb1e XOR %R13D,%R13D |
(4054) 0x4cdb21 ADD %RAX,%R13 |
(4054) 0x4cdb24 NOPW %CS:(%RAX,%RAX,1) |
(4055) 0x4cdb30 MOV (%R12,%R13,8),%RAX |
(4055) 0x4cdb34 VMOVSD (%R11,%RAX,8),%XMM2 |
(4055) 0x4cdb3a VFMADD231SD (%R10,%R13,8),%XMM2,%XMM1 |
(4055) 0x4cdb40 INC %R13 |
(4055) 0x4cdb43 CMP %R13,%R9 |
(4055) 0x4cdb46 JNE 4cdb30 |
(4054) 0x4cdb48 JMP 4cda60 |
0x4cdb4d VUCOMISD 0x144db(%RIP),%XMM0 |
0x4cdb55 JNE 4cdece |
0x4cdb5b CMP %R15,%R14 |
0x4cdb5e JGE 4ce20e |
0x4cdb64 MOV (%R12),%RDI |
0x4cdb68 MOV (%RSI),%RSI |
0x4cdb6b MOV %R14,%RAX |
0x4cdb6e NOT %RAX |
0x4cdb71 ADD %RAX,%R15 |
0x4cdb74 XOR %R8D,%R8D |
0x4cdb77 MOV %R15,-0x38(%RBP) |
0x4cdb7b MOV %RSI,-0x30(%RBP) |
0x4cdb7f JMP 4cdba6 |
0x4cdb81 NOPW %CS:(%RAX,%RAX,1) |
(4033) 0x4cdb90 VMOVSD %XMM0,(%RSI,%R9,8) |
(4033) 0x4cdb96 LEA 0x1(%R8),%RAX |
(4033) 0x4cdb9a CMP %R15,%R8 |
(4033) 0x4cdb9d MOV %RAX,%R8 |
(4033) 0x4cdba0 JE 4ce20e |
(4033) 0x4cdba6 LEA (%R14,%R8,1),%R9 |
(4033) 0x4cdbaa VMULSD (%RBX,%R9,8),%XMM5,%XMM0 |
(4033) 0x4cdbb0 MOV (%RDI,%R9,8),%RAX |
(4033) 0x4cdbb4 MOV 0x8(%RDI,%R9,8),%R10 |
(4033) 0x4cdbb9 MOV %R10,%RCX |
(4033) 0x4cdbbc SUB %RAX,%RCX |
(4033) 0x4cdbbf JLE 4cdb90 |
(4033) 0x4cdbc1 MOV -0x48(%RBP),%RDX |
(4033) 0x4cdbc5 MOV (%RDX),%R11 |
(4033) 0x4cdbc8 MOV 0x20(%RBP),%RDX |
(4033) 0x4cdbcc MOV (%RDX),%R12 |
(4033) 0x4cdbcf MOV 0x10(%RBP),%RDX |
(4033) 0x4cdbd3 MOV (%RDX),%R13 |
(4033) 0x4cdbd6 MOV %RCX,%RDX |
(4033) 0x4cdbd9 AND $-0x4,%RDX |
(4033) 0x4cdbdd JE 4cdc56 |
(4033) 0x4cdbdf LEA -0x1(%RDX),%RBX |
(4033) 0x4cdbe3 LEA (%R11,%RAX,8),%RSI |
(4033) 0x4cdbe7 LEA (%R13,%RAX,8),%R14 |
(4033) 0x4cdbec VXORPD %XMM1,%XMM1,%XMM1 |
(4033) 0x4cdbf0 XOR %R15D,%R15D |
(4033) 0x4cdbf3 NOPW %CS:(%RAX,%RAX,1) |
(4035) 0x4cdc00 VMOVUPD (%R14,%R15,8),%YMM2 |
(4035) 0x4cdc06 KXNORW %K0,%K0,%K1 |
(4035) 0x4cdc0a VXORPD %XMM3,%XMM3,%XMM3 |
(4035) 0x4cdc0e VGATHERQPD (%R12,%YMM2,8),%YMM3{%K1} |
(4035) 0x4cdc15 VFMADD231PD (%RSI,%R15,8),%YMM3,%YMM1 |
(4035) 0x4cdc1b ADD $0x4,%R15 |
(4035) 0x4cdc1f CMP %RBX,%R15 |
(4035) 0x4cdc22 JBE 4cdc00 |
(4033) 0x4cdc24 VEXTRACTF128 $0x1,%YMM1,%XMM2 |
(4033) 0x4cdc2a VADDPD %XMM2,%XMM1,%XMM1 |
(4033) 0x4cdc2e VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(4033) 0x4cdc33 VADDSD %XMM2,%XMM1,%XMM1 |
(4033) 0x4cdc37 VADDSD %XMM1,%XMM0,%XMM0 |
(4033) 0x4cdc3b CMP %RDX,%RCX |
(4033) 0x4cdc3e MOV -0x40(%RBP),%R14 |
(4033) 0x4cdc42 MOV -0x38(%RBP),%R15 |
(4033) 0x4cdc46 MOV 0x28(%RBP),%RBX |
(4033) 0x4cdc4a MOV -0x30(%RBP),%RSI |
(4033) 0x4cdc4e JE 4cdb90 |
(4033) 0x4cdc54 JMP 4cdc58 |
(4033) 0x4cdc56 XOR %EDX,%EDX |
(4033) 0x4cdc58 ADD %RAX,%RDX |
(4033) 0x4cdc5b NOPL (%RAX,%RAX,1) |
(4034) 0x4cdc60 MOV (%R13,%RDX,8),%RAX |
(4034) 0x4cdc65 VMOVSD (%R12,%RAX,8),%XMM1 |
(4034) 0x4cdc6b VFMADD231SD (%R11,%RDX,8),%XMM1,%XMM0 |
(4034) 0x4cdc71 INC %RDX |
(4034) 0x4cdc74 CMP %RDX,%R10 |
(4034) 0x4cdc77 JNE 4cdc60 |
(4033) 0x4cdc79 JMP 4cdb90 |
0x4cdc7e VUCOMISD 0x152aa(%RIP),%XMM0 |
0x4cdc86 JNE 4cdfee |
0x4cdc8c CMP %R15,%R14 |
0x4cdc8f JGE 4ce20e |
0x4cdc95 MOV (%R12),%RDI |
0x4cdc99 MOV (%RSI),%RSI |
0x4cdc9c MOV %R14,%RAX |
0x4cdc9f NOT %RAX |
0x4cdca2 ADD %RAX,%R15 |
0x4cdca5 XOR %R8D,%R8D |
0x4cdca8 VMOVDDUP 0x15030(%RIP),%XMM0 |
0x4cdcb0 MOV %R15,-0x38(%RBP) |
0x4cdcb4 MOV %RSI,-0x30(%RBP) |
0x4cdcb8 JMP 4cdcd6 |
0x4cdcba NOPW (%RAX,%RAX,1) |
(4039) 0x4cdcc0 VMOVSD %XMM1,(%RSI,%R9,8) |
(4039) 0x4cdcc6 LEA 0x1(%R8),%RAX |
(4039) 0x4cdcca CMP %R15,%R8 |
(4039) 0x4cdccd MOV %RAX,%R8 |
(4039) 0x4cdcd0 JE 4ce20e |
(4039) 0x4cdcd6 LEA (%R14,%R8,1),%R9 |
(4039) 0x4cdcda VMOVSD (%RBX,%R9,8),%XMM1 |
(4039) 0x4cdce0 VXORPD %XMM0,%XMM1,%XMM1 |
(4039) 0x4cdce4 MOV (%RDI,%R9,8),%RAX |
(4039) 0x4cdce8 MOV 0x8(%RDI,%R9,8),%R10 |
(4039) 0x4cdced MOV %R10,%RCX |
(4039) 0x4cdcf0 SUB %RAX,%RCX |
(4039) 0x4cdcf3 JLE 4cdcc0 |
(4039) 0x4cdcf5 MOV -0x48(%RBP),%RDX |
(4039) 0x4cdcf9 MOV (%RDX),%R11 |
(4039) 0x4cdcfc MOV 0x20(%RBP),%RDX |
(4039) 0x4cdd00 MOV (%RDX),%R12 |
(4039) 0x4cdd03 MOV 0x10(%RBP),%RDX |
(4039) 0x4cdd07 MOV (%RDX),%R13 |
(4039) 0x4cdd0a MOV %RCX,%RDX |
(4039) 0x4cdd0d AND $-0x4,%RDX |
(4039) 0x4cdd11 JE 4cdd86 |
(4039) 0x4cdd13 LEA -0x1(%RDX),%RBX |
(4039) 0x4cdd17 LEA (%R11,%RAX,8),%RSI |
(4039) 0x4cdd1b LEA (%R13,%RAX,8),%R14 |
(4039) 0x4cdd20 VXORPD %XMM2,%XMM2,%XMM2 |
(4039) 0x4cdd24 XOR %R15D,%R15D |
(4039) 0x4cdd27 NOPW (%RAX,%RAX,1) |
(4041) 0x4cdd30 VMOVUPD (%R14,%R15,8),%YMM3 |
(4041) 0x4cdd36 VXORPD %XMM4,%XMM4,%XMM4 |
(4041) 0x4cdd3a KXNORW %K0,%K0,%K1 |
(4041) 0x4cdd3e VGATHERQPD (%R12,%YMM3,8),%YMM4{%K1} |
(4041) 0x4cdd45 VFNMADD231PD (%RSI,%R15,8),%YMM4,%YMM2 |
(4041) 0x4cdd4b ADD $0x4,%R15 |
(4041) 0x4cdd4f CMP %RBX,%R15 |
(4041) 0x4cdd52 JBE 4cdd30 |
(4039) 0x4cdd54 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4039) 0x4cdd5a VADDPD %XMM3,%XMM2,%XMM2 |
(4039) 0x4cdd5e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4039) 0x4cdd63 VADDSD %XMM3,%XMM2,%XMM2 |
(4039) 0x4cdd67 VADDSD %XMM2,%XMM1,%XMM1 |
(4039) 0x4cdd6b CMP %RDX,%RCX |
(4039) 0x4cdd6e MOV -0x40(%RBP),%R14 |
(4039) 0x4cdd72 MOV -0x38(%RBP),%R15 |
(4039) 0x4cdd76 MOV 0x28(%RBP),%RBX |
(4039) 0x4cdd7a MOV -0x30(%RBP),%RSI |
(4039) 0x4cdd7e JE 4cdcc0 |
(4039) 0x4cdd84 JMP 4cdd88 |
(4039) 0x4cdd86 XOR %EDX,%EDX |
(4039) 0x4cdd88 ADD %RAX,%RDX |
(4039) 0x4cdd8b NOPL (%RAX,%RAX,1) |
(4040) 0x4cdd90 MOV (%R13,%RDX,8),%RAX |
(4040) 0x4cdd95 VMOVSD (%R12,%RAX,8),%XMM2 |
(4040) 0x4cdd9b VFNMADD231SD (%R11,%RDX,8),%XMM2,%XMM1 |
(4040) 0x4cdda1 INC %RDX |
(4040) 0x4cdda4 CMP %RDX,%R10 |
(4040) 0x4cdda7 JNE 4cdd90 |
(4039) 0x4cdda9 JMP 4cdcc0 |
0x4cddae CMP %R15,%R14 |
0x4cddb1 JGE 4ce20e |
0x4cddb7 MOV (%R12),%RDI |
0x4cddbb MOV (%RSI),%RSI |
0x4cddbe MOV %R14,%RAX |
0x4cddc1 NOT %RAX |
0x4cddc4 ADD %RAX,%R15 |
0x4cddc7 XOR %R8D,%R8D |
0x4cddca VMOVDDUP 0x14f0e(%RIP),%XMM1 |
0x4cddd2 MOV %R15,-0x38(%RBP) |
0x4cddd6 MOV %RSI,-0x30(%RBP) |
0x4cddda JMP 4cddfa |
0x4cdddc NOPL (%RAX) |
(4045) 0x4cdde0 VMULSD %XMM0,%XMM2,%XMM2 |
(4045) 0x4cdde4 VMOVSD %XMM2,(%RSI,%R9,8) |
(4045) 0x4cddea LEA 0x1(%R8),%RAX |
(4045) 0x4cddee CMP %R15,%R8 |
(4045) 0x4cddf1 MOV %RAX,%R8 |
(4045) 0x4cddf4 JE 4ce20e |
(4045) 0x4cddfa LEA (%R14,%R8,1),%R9 |
(4045) 0x4cddfe VMOVSD (%RBX,%R9,8),%XMM2 |
(4045) 0x4cde04 VXORPD %XMM1,%XMM2,%XMM2 |
(4045) 0x4cde08 MOV (%RDI,%R9,8),%RAX |
(4045) 0x4cde0c MOV 0x8(%RDI,%R9,8),%R10 |
(4045) 0x4cde11 MOV %R10,%RCX |
(4045) 0x4cde14 SUB %RAX,%RCX |
(4045) 0x4cde17 JLE 4cdde0 |
(4045) 0x4cde19 MOV -0x48(%RBP),%RDX |
(4045) 0x4cde1d MOV (%RDX),%R11 |
(4045) 0x4cde20 MOV 0x20(%RBP),%RDX |
(4045) 0x4cde24 MOV (%RDX),%R12 |
(4045) 0x4cde27 MOV 0x10(%RBP),%RDX |
(4045) 0x4cde2b MOV (%RDX),%R13 |
(4045) 0x4cde2e MOV %RCX,%RDX |
(4045) 0x4cde31 AND $-0x4,%RDX |
(4045) 0x4cde35 JE 4cdea6 |
(4045) 0x4cde37 LEA -0x1(%RDX),%RBX |
(4045) 0x4cde3b LEA (%R11,%RAX,8),%RSI |
(4045) 0x4cde3f LEA (%R13,%RAX,8),%R14 |
(4045) 0x4cde44 VXORPD %XMM3,%XMM3,%XMM3 |
(4045) 0x4cde48 XOR %R15D,%R15D |
(4045) 0x4cde4b NOPL (%RAX,%RAX,1) |
(4047) 0x4cde50 VMOVUPD (%R14,%R15,8),%YMM4 |
(4047) 0x4cde56 VXORPD %XMM5,%XMM5,%XMM5 |
(4047) 0x4cde5a KXNORW %K0,%K0,%K1 |
(4047) 0x4cde5e VGATHERQPD (%R12,%YMM4,8),%YMM5{%K1} |
(4047) 0x4cde65 VFMADD231PD (%RSI,%R15,8),%YMM5,%YMM3 |
(4047) 0x4cde6b ADD $0x4,%R15 |
(4047) 0x4cde6f CMP %RBX,%R15 |
(4047) 0x4cde72 JBE 4cde50 |
(4045) 0x4cde74 VEXTRACTF128 $0x1,%YMM3,%XMM4 |
(4045) 0x4cde7a VADDPD %XMM4,%XMM3,%XMM3 |
(4045) 0x4cde7e VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(4045) 0x4cde83 VADDSD %XMM4,%XMM3,%XMM3 |
(4045) 0x4cde87 VADDSD %XMM3,%XMM2,%XMM2 |
(4045) 0x4cde8b CMP %RDX,%RCX |
(4045) 0x4cde8e MOV -0x40(%RBP),%R14 |
(4045) 0x4cde92 MOV -0x38(%RBP),%R15 |
(4045) 0x4cde96 MOV 0x28(%RBP),%RBX |
(4045) 0x4cde9a MOV -0x30(%RBP),%RSI |
(4045) 0x4cde9e JE 4cdde0 |
(4045) 0x4cdea4 JMP 4cdea8 |
(4045) 0x4cdea6 XOR %EDX,%EDX |
(4045) 0x4cdea8 ADD %RAX,%RDX |
(4045) 0x4cdeab NOPL (%RAX,%RAX,1) |
(4046) 0x4cdeb0 MOV (%R13,%RDX,8),%RAX |
(4046) 0x4cdeb5 VMOVSD (%R12,%RAX,8),%XMM3 |
(4046) 0x4cdebb VFMADD231SD (%R11,%RDX,8),%XMM3,%XMM2 |
(4046) 0x4cdec1 INC %RDX |
(4046) 0x4cdec4 CMP %RDX,%R10 |
(4046) 0x4cdec7 JNE 4cdeb0 |
(4045) 0x4cdec9 JMP 4cdde0 |
0x4cdece VUCOMISD 0x1505a(%RIP),%XMM0 |
0x4cded6 JNE 4ce0fe |
0x4cdedc CMP %R15,%R14 |
0x4cdedf JGE 4ce20e |
0x4cdee5 VXORPD 0x14df1(%RIP){1to2},%XMM5,%XMM0 |
0x4cdeef MOV (%R12),%RDI |
0x4cdef3 MOV (%RSI),%RDX |
0x4cdef6 MOV %R14,%RAX |
0x4cdef9 NOT %RAX |
0x4cdefc ADD %RAX,%R15 |
0x4cdeff XOR %R8D,%R8D |
0x4cdf02 MOV %R15,-0x38(%RBP) |
0x4cdf06 MOV %RDX,-0x30(%RBP) |
0x4cdf0a JMP 4cdf22 |
(4030) 0x4cdf0c VMOVSD %XMM1,(%RDX,%R9,8) |
(4030) 0x4cdf12 LEA 0x1(%R8),%RAX |
(4030) 0x4cdf16 CMP %R15,%R8 |
(4030) 0x4cdf19 MOV %RAX,%R8 |
(4030) 0x4cdf1c JE 4ce20e |
(4030) 0x4cdf22 LEA (%R14,%R8,1),%R9 |
(4030) 0x4cdf26 VMULSD (%RBX,%R9,8),%XMM0,%XMM1 |
(4030) 0x4cdf2c MOV (%RDI,%R9,8),%RAX |
(4030) 0x4cdf30 MOV 0x8(%RDI,%R9,8),%R10 |
(4030) 0x4cdf35 MOV %R10,%RCX |
(4030) 0x4cdf38 SUB %RAX,%RCX |
(4030) 0x4cdf3b JLE 4cdf0c |
(4030) 0x4cdf3d MOV -0x48(%RBP),%RDX |
(4030) 0x4cdf41 MOV (%RDX),%R11 |
(4030) 0x4cdf44 MOV 0x20(%RBP),%RDX |
(4030) 0x4cdf48 MOV (%RDX),%R12 |
(4030) 0x4cdf4b MOV 0x10(%RBP),%RDX |
(4030) 0x4cdf4f MOV (%RDX),%R13 |
(4030) 0x4cdf52 MOV %RCX,%RSI |
(4030) 0x4cdf55 AND $-0x4,%RSI |
(4030) 0x4cdf59 JE 4cdfc6 |
(4030) 0x4cdf5b LEA -0x1(%RSI),%RDX |
(4030) 0x4cdf5f LEA (%R11,%RAX,8),%RBX |
(4030) 0x4cdf63 LEA (%R13,%RAX,8),%R14 |
(4030) 0x4cdf68 VXORPD %XMM2,%XMM2,%XMM2 |
(4030) 0x4cdf6c XOR %R15D,%R15D |
(4030) 0x4cdf6f NOP |
(4032) 0x4cdf70 VMOVUPD (%R14,%R15,8),%YMM3 |
(4032) 0x4cdf76 VXORPD %XMM4,%XMM4,%XMM4 |
(4032) 0x4cdf7a KXNORW %K0,%K0,%K1 |
(4032) 0x4cdf7e VGATHERQPD (%R12,%YMM3,8),%YMM4{%K1} |
(4032) 0x4cdf85 VFNMADD231PD (%RBX,%R15,8),%YMM4,%YMM2 |
(4032) 0x4cdf8b ADD $0x4,%R15 |
(4032) 0x4cdf8f CMP %RDX,%R15 |
(4032) 0x4cdf92 JBE 4cdf70 |
(4030) 0x4cdf94 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4030) 0x4cdf9a VADDPD %XMM3,%XMM2,%XMM2 |
(4030) 0x4cdf9e VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4030) 0x4cdfa3 VADDSD %XMM3,%XMM2,%XMM2 |
(4030) 0x4cdfa7 VADDSD %XMM2,%XMM1,%XMM1 |
(4030) 0x4cdfab CMP %RSI,%RCX |
(4030) 0x4cdfae MOV -0x40(%RBP),%R14 |
(4030) 0x4cdfb2 MOV -0x38(%RBP),%R15 |
(4030) 0x4cdfb6 MOV 0x28(%RBP),%RBX |
(4030) 0x4cdfba MOV -0x30(%RBP),%RDX |
(4030) 0x4cdfbe JE 4cdf0c |
(4030) 0x4cdfc4 JMP 4cdfcc |
(4030) 0x4cdfc6 XOR %ESI,%ESI |
(4030) 0x4cdfc8 MOV -0x30(%RBP),%RDX |
(4030) 0x4cdfcc ADD %RAX,%RSI |
(4030) 0x4cdfcf NOP |
(4031) 0x4cdfd0 MOV (%R13,%RSI,8),%RAX |
(4031) 0x4cdfd5 VMOVSD (%R12,%RAX,8),%XMM2 |
(4031) 0x4cdfdb VFNMADD231SD (%R11,%RSI,8),%XMM2,%XMM1 |
(4031) 0x4cdfe1 INC %RSI |
(4031) 0x4cdfe4 CMP %RSI,%R10 |
(4031) 0x4cdfe7 JNE 4cdfd0 |
(4030) 0x4cdfe9 JMP 4cdf0c |
0x4cdfee CMP %R15,%R14 |
0x4cdff1 JGE 4ce20e |
0x4cdff7 MOV (%R12),%RDI |
0x4cdffb MOV (%RSI),%RSI |
0x4cdffe MOV %R14,%RAX |
0x4ce001 NOT %RAX |
0x4ce004 ADD %RAX,%R15 |
0x4ce007 XOR %R8D,%R8D |
0x4ce00a MOV %R15,-0x38(%RBP) |
0x4ce00e MOV %RSI,-0x30(%RBP) |
0x4ce012 JMP 4ce02e |
(4036) 0x4ce014 VMULSD %XMM0,%XMM1,%XMM1 |
(4036) 0x4ce018 VMOVSD %XMM1,(%RSI,%R9,8) |
(4036) 0x4ce01e LEA 0x1(%R8),%RAX |
(4036) 0x4ce022 CMP %R15,%R8 |
(4036) 0x4ce025 MOV %RAX,%R8 |
(4036) 0x4ce028 JE 4ce20e |
(4036) 0x4ce02e LEA (%R14,%R8,1),%R9 |
(4036) 0x4ce032 VMOVSD (%RBX,%R9,8),%XMM1 |
(4036) 0x4ce038 MOV (%RDI,%R9,8),%RAX |
(4036) 0x4ce03c MOV 0x8(%RDI,%R9,8),%R10 |
(4036) 0x4ce041 MOV %R10,%RCX |
(4036) 0x4ce044 SUB %RAX,%RCX |
(4036) 0x4ce047 JLE 4ce014 |
(4036) 0x4ce049 MOV -0x48(%RBP),%RDX |
(4036) 0x4ce04d MOV (%RDX),%R11 |
(4036) 0x4ce050 MOV 0x20(%RBP),%RDX |
(4036) 0x4ce054 MOV (%RDX),%R12 |
(4036) 0x4ce057 MOV 0x10(%RBP),%RDX |
(4036) 0x4ce05b MOV (%RDX),%R13 |
(4036) 0x4ce05e MOV %RCX,%RDX |
(4036) 0x4ce061 AND $-0x4,%RDX |
(4036) 0x4ce065 JE 4ce0d6 |
(4036) 0x4ce067 LEA -0x1(%RDX),%RBX |
(4036) 0x4ce06b LEA (%R11,%RAX,8),%RSI |
(4036) 0x4ce06f LEA (%R13,%RAX,8),%R14 |
(4036) 0x4ce074 VXORPD %XMM2,%XMM2,%XMM2 |
(4036) 0x4ce078 XOR %R15D,%R15D |
(4036) 0x4ce07b NOPL (%RAX,%RAX,1) |
(4038) 0x4ce080 VMOVUPD (%R14,%R15,8),%YMM3 |
(4038) 0x4ce086 KXNORW %K0,%K0,%K1 |
(4038) 0x4ce08a VXORPD %XMM4,%XMM4,%XMM4 |
(4038) 0x4ce08e VGATHERQPD (%R12,%YMM3,8),%YMM4{%K1} |
(4038) 0x4ce095 VFMADD231PD (%RSI,%R15,8),%YMM4,%YMM2 |
(4038) 0x4ce09b ADD $0x4,%R15 |
(4038) 0x4ce09f CMP %RBX,%R15 |
(4038) 0x4ce0a2 JBE 4ce080 |
(4036) 0x4ce0a4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4036) 0x4ce0aa VADDPD %XMM3,%XMM2,%XMM2 |
(4036) 0x4ce0ae VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4036) 0x4ce0b3 VADDSD %XMM3,%XMM2,%XMM2 |
(4036) 0x4ce0b7 VADDSD %XMM2,%XMM1,%XMM1 |
(4036) 0x4ce0bb CMP %RDX,%RCX |
(4036) 0x4ce0be MOV -0x40(%RBP),%R14 |
(4036) 0x4ce0c2 MOV -0x38(%RBP),%R15 |
(4036) 0x4ce0c6 MOV 0x28(%RBP),%RBX |
(4036) 0x4ce0ca MOV -0x30(%RBP),%RSI |
(4036) 0x4ce0ce JE 4ce014 |
(4036) 0x4ce0d4 JMP 4ce0d8 |
(4036) 0x4ce0d6 XOR %EDX,%EDX |
(4036) 0x4ce0d8 ADD %RAX,%RDX |
(4036) 0x4ce0db NOPL (%RAX,%RAX,1) |
(4037) 0x4ce0e0 MOV (%R13,%RDX,8),%RAX |
(4037) 0x4ce0e5 VMOVSD (%R12,%RAX,8),%XMM2 |
(4037) 0x4ce0eb VFMADD231SD (%R11,%RDX,8),%XMM2,%XMM1 |
(4037) 0x4ce0f1 INC %RDX |
(4037) 0x4ce0f4 CMP %RDX,%R10 |
(4037) 0x4ce0f7 JNE 4ce0e0 |
(4036) 0x4ce0f9 JMP 4ce014 |
0x4ce0fe CMP %R15,%R14 |
0x4ce101 JGE 4ce20e |
0x4ce107 MOV (%R12),%RDI |
0x4ce10b MOV (%RSI),%RDX |
0x4ce10e MOV %R14,%RAX |
0x4ce111 NOT %RAX |
0x4ce114 ADD %RAX,%R15 |
0x4ce117 XOR %R8D,%R8D |
0x4ce11a MOV %R15,-0x38(%RBP) |
0x4ce11e MOV %RDX,-0x30(%RBP) |
0x4ce122 JMP 4ce13e |
(4027) 0x4ce124 VMULSD %XMM0,%XMM1,%XMM1 |
(4027) 0x4ce128 VMOVSD %XMM1,(%RDX,%R9,8) |
(4027) 0x4ce12e LEA 0x1(%R8),%RAX |
(4027) 0x4ce132 CMP %R15,%R8 |
(4027) 0x4ce135 MOV %RAX,%R8 |
(4027) 0x4ce138 JE 4ce20e |
(4027) 0x4ce13e LEA (%R14,%R8,1),%R9 |
(4027) 0x4ce142 VMULSD (%RBX,%R9,8),%XMM5,%XMM1 |
(4027) 0x4ce148 MOV (%RDI,%R9,8),%RAX |
(4027) 0x4ce14c MOV 0x8(%RDI,%R9,8),%R10 |
(4027) 0x4ce151 MOV %R10,%RCX |
(4027) 0x4ce154 SUB %RAX,%RCX |
(4027) 0x4ce157 JLE 4ce124 |
(4027) 0x4ce159 MOV -0x48(%RBP),%RDX |
(4027) 0x4ce15d MOV (%RDX),%R11 |
(4027) 0x4ce160 MOV 0x20(%RBP),%RDX |
(4027) 0x4ce164 MOV (%RDX),%R12 |
(4027) 0x4ce167 MOV 0x10(%RBP),%RDX |
(4027) 0x4ce16b MOV (%RDX),%R13 |
(4027) 0x4ce16e MOV %RCX,%RSI |
(4027) 0x4ce171 AND $-0x4,%RSI |
(4027) 0x4ce175 JE 4ce1e6 |
(4027) 0x4ce177 LEA -0x1(%RSI),%RDX |
(4027) 0x4ce17b LEA (%R11,%RAX,8),%RBX |
(4027) 0x4ce17f LEA (%R13,%RAX,8),%R14 |
(4027) 0x4ce184 VXORPD %XMM2,%XMM2,%XMM2 |
(4027) 0x4ce188 XOR %R15D,%R15D |
(4027) 0x4ce18b NOPL (%RAX,%RAX,1) |
(4029) 0x4ce190 VMOVUPD (%R14,%R15,8),%YMM3 |
(4029) 0x4ce196 VXORPD %XMM4,%XMM4,%XMM4 |
(4029) 0x4ce19a KXNORW %K0,%K0,%K1 |
(4029) 0x4ce19e VGATHERQPD (%R12,%YMM3,8),%YMM4{%K1} |
(4029) 0x4ce1a5 VFMADD231PD (%RBX,%R15,8),%YMM4,%YMM2 |
(4029) 0x4ce1ab ADD $0x4,%R15 |
(4029) 0x4ce1af CMP %RDX,%R15 |
(4029) 0x4ce1b2 JBE 4ce190 |
(4027) 0x4ce1b4 VEXTRACTF128 $0x1,%YMM2,%XMM3 |
(4027) 0x4ce1ba VADDPD %XMM3,%XMM2,%XMM2 |
(4027) 0x4ce1be VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(4027) 0x4ce1c3 VADDSD %XMM3,%XMM2,%XMM2 |
(4027) 0x4ce1c7 VADDSD %XMM2,%XMM1,%XMM1 |
(4027) 0x4ce1cb CMP %RSI,%RCX |
(4027) 0x4ce1ce MOV -0x40(%RBP),%R14 |
(4027) 0x4ce1d2 MOV -0x38(%RBP),%R15 |
(4027) 0x4ce1d6 MOV 0x28(%RBP),%RBX |
(4027) 0x4ce1da MOV -0x30(%RBP),%RDX |
(4027) 0x4ce1de JE 4ce124 |
(4027) 0x4ce1e4 JMP 4ce1ec |
(4027) 0x4ce1e6 XOR %ESI,%ESI |
(4027) 0x4ce1e8 MOV -0x30(%RBP),%RDX |
(4027) 0x4ce1ec ADD %RAX,%RSI |
(4027) 0x4ce1ef NOP |
(4028) 0x4ce1f0 MOV (%R13,%RSI,8),%RAX |
(4028) 0x4ce1f5 VMOVSD (%R12,%RAX,8),%XMM2 |
(4028) 0x4ce1fb VFMADD231SD (%R11,%RSI,8),%XMM2,%XMM1 |
(4028) 0x4ce201 INC %RSI |
(4028) 0x4ce204 CMP %RSI,%R10 |
(4028) 0x4ce207 JNE 4ce1f0 |
(4027) 0x4ce209 JMP 4ce124 |
0x4ce20e ADD $0x28,%RSP |
0x4ce212 POP %RBX |
0x4ce213 POP %R12 |
0x4ce215 POP %R13 |
0x4ce217 POP %R14 |
0x4ce219 POP %R15 |
0x4ce21b POP %RBP |
0x4ce21c VZEROUPPER |
0x4ce21f RET |
Path / |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 242 |
nb uops | 261 |
loop length | 991 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 8 |
micro-operation queue | 43.50 cycles |
front end | 43.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 19.40 | 17.67 | 17.67 | 20.00 | 19.40 | 20.00 | 20.00 | 20.00 | 20.00 | 19.20 | 17.67 |
cycles | 20.00 | 19.40 | 17.67 | 17.67 | 20.00 | 19.40 | 20.00 | 20.00 | 20.00 | 20.00 | 19.20 | 17.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 42.22 |
Stall cycles | 0.00 |
Front-end | 43.50 |
Dispatch | 20.00 |
Overall L1 | 43.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 2% |
all | 11% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cbd60 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cbde0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4cd3b7 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x67> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x24d870(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4525,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f653b,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d58d0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f6ee1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8210 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4cd3c5 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4cd3f3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x24d834(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4525,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f6f68,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d58d0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f6ee1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8210 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4cd402 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4cd435 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x24d7f7(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4525,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f6f8a,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d58d0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f6ee1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8210 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R14,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4cd56d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x21d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x14bd8(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd6ae <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x35e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd4a6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x156> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x28(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x159b7(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd7cd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x47d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x14aa9(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd8fe <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x5ae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x1572f(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd5d6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x286> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1587a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cda2e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x6de> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd706 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x3b6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1485b(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cdb4d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x1484d(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cdc7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x92e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd826 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4d6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1562a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cddae <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa5e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd956 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x606> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cda7a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x72a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x144db(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cdece <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb7e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cdba6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x856> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x152aa(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cdfee <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc9e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x15030(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cdcd6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x986> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x14f0e(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cddfa <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xaaa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1505a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4ce0fe <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x14df1(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cdf22 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbd2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4ce02e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcde> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4ce13e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 242 |
nb uops | 261 |
loop length | 991 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 8 |
micro-operation queue | 43.50 cycles |
front end | 43.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 19.40 | 17.67 | 17.67 | 20.00 | 19.40 | 20.00 | 20.00 | 20.00 | 20.00 | 19.20 | 17.67 |
cycles | 20.00 | 19.40 | 17.67 | 17.67 | 20.00 | 19.40 | 20.00 | 20.00 | 20.00 | 20.00 | 19.20 | 17.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 42.22 |
Stall cycles | 0.00 |
Front-end | 43.50 |
Dispatch | 20.00 |
Overall L1 | 43.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 2% |
all | 11% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 2% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 4% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cbd60 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4cbde0 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4cd3b7 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x67> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x24d870(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4525,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f653b,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d58d0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f6ee1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8210 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4cd3c5 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x75> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4cd3f3 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x24d834(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4525,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f6f68,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d58d0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f6ee1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8210 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R15,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4cd402 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb2> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RBX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4cd435 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x24d7f7(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4f4525,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4f6f8a,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d58d0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4f6ee1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d8210 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM5 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R14,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4cd56d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x21d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x14bd8(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd6ae <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x35e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd4a6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x156> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x28(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x159b7(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd7cd <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x47d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x14aa9(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cd8fe <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x5ae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x1572f(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd5d6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x286> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1587a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cda2e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x6de> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd706 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x3b6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1485b(%RIP),%XMM5 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cdb4d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x7fd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x1484d(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cdc7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x92e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd826 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4d6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1562a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cddae <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa5e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cd956 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x606> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cda7a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x72a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x144db(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cdece <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb7e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cdba6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x856> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x152aa(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4cdfee <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc9e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x15030(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cdcd6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x986> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x14f0e(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cddfa <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xaaa> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x1505a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4ce0fe <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x14df1(%RIP){1to2},%XMM5,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4cdf22 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xbd2> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4ce02e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xcde> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R15,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4ce20e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xebe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R12),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R15,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4ce13e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x28,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace.extracted– | 11.2 | 1.82 |
▼Loop 4042 - csr_matvec.c:248-341 - exec– | 0.85 | 0.12 |
○Loop 4043 - csr_matvec.c:337-339 - exec | 0.54 | 0.07 |
○Loop 4044 - csr_matvec.c:337-339 - exec | 0.14 | 0.02 |
▼Loop 4048 - csr_matvec.c:248-314 - exec– | 0.64 | 0.09 |
○Loop 4050 - csr_matvec.c:310-312 - exec | 3.83 | 0.52 |
○Loop 4049 - csr_matvec.c:310-312 - exec | 0.66 | 0.09 |
▼Loop 4060 - csr_matvec.c:248-263 - exec– | 0.51 | 0.07 |
○Loop 4062 - csr_matvec.c:259-261 - exec | 3.44 | 0.47 |
○Loop 4061 - csr_matvec.c:259-261 - exec | 0.6 | 0.08 |
▼Loop 4030 - csr_matvec.c:248-392 - exec– | 0 | 0 |
○Loop 4031 - csr_matvec.c:388-390 - exec | 0 | 0 |
○Loop 4032 - csr_matvec.c:388-390 - exec | 0 | 0 |
▼Loop 4027 - csr_matvec.c:248-404 - exec– | 0 | 0 |
○Loop 4029 - csr_matvec.c:400-402 - exec | 0 | 0 |
○Loop 4028 - csr_matvec.c:400-402 - exec | 0 | 0 |
▼Loop 4045 - csr_matvec.c:248-326 - exec– | 0 | 0 |
○Loop 4046 - csr_matvec.c:322-324 - exec | 0 | 0 |
○Loop 4047 - csr_matvec.c:322-324 - exec | 0 | 0 |
▼Loop 4033 - csr_matvec.c:248-380 - exec– | 0 | 0 |
○Loop 4035 - csr_matvec.c:376-378 - exec | 0 | 0 |
○Loop 4034 - csr_matvec.c:376-378 - exec | 0 | 0 |
▼Loop 4051 - csr_matvec.c:248-302 - exec– | 0 | 0 |
○Loop 4053 - csr_matvec.c:298-300 - exec | 0 | 0 |
○Loop 4052 - csr_matvec.c:298-300 - exec | 0 | 0 |
▼Loop 4054 - csr_matvec.c:248-287 - exec– | 0 | 0 |
○Loop 4055 - csr_matvec.c:283-285 - exec | 0 | 0 |
○Loop 4056 - csr_matvec.c:283-285 - exec | 0 | 0 |
▼Loop 4039 - csr_matvec.c:248-353 - exec– | 0 | 0 |
○Loop 4041 - csr_matvec.c:349-351 - exec | 0 | 0 |
○Loop 4040 - csr_matvec.c:349-351 - exec | 0 | 0 |
▼Loop 4036 - csr_matvec.c:248-365 - exec– | 0 | 0 |
○Loop 4037 - csr_matvec.c:361-363 - exec | 0 | 0 |
○Loop 4038 - csr_matvec.c:361-363 - exec | 0 | 0 |
▼Loop 4057 - csr_matvec.c:248-275 - exec– | 0 | 0 |
○Loop 4059 - csr_matvec.c:271-273 - exec | 0 | 0 |
○Loop 4058 - csr_matvec.c:271-273 - exec | 0 | 0 |