Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 18.58% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace.extracted | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 18.58% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-586-9096/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 243 - 404 |
-------------------------------------------------------------------------------- |
243: #pragma omp parallel private(i,jj,tempx) |
244: #endif |
245: { |
246: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
247: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
248: hypre_assert(iBegin <= iEnd); |
249: hypre_assert(iBegin >= 0 && iBegin <= num_rows); |
250: hypre_assert(iEnd >= 0 && iEnd <= num_rows); |
251: |
252: if (0 == temp) |
253: { |
254: if (1 == alpha) // JSP: a common path |
255: { |
256: for (i = iBegin; i < iEnd; i++) |
257: { |
258: tempx = 0.0; |
259: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
260: { |
261: tempx += A_data[jj] * x_data[A_j[jj]]; |
262: } |
263: y_data[i] = tempx; |
264: } |
265: } // y = A*x |
266: else if (-1 == alpha) |
267: { |
268: for (i = iBegin; i < iEnd; i++) |
269: { |
270: tempx = 0.0; |
271: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
272: { |
273: tempx -= A_data[jj] * x_data[A_j[jj]]; |
274: } |
275: y_data[i] = tempx; |
276: } |
277: } // y = -A*x |
278: else |
279: { |
280: for (i = iBegin; i < iEnd; i++) |
281: { |
282: tempx = 0.0; |
283: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
284: { |
285: tempx += A_data[jj] * x_data[A_j[jj]]; |
286: } |
287: y_data[i] = alpha*tempx; |
288: } |
289: } // y = alpha*A*x |
290: } // temp == 0 |
291: else if (-1 == temp) // beta == -alpha |
292: { |
293: if (1 == alpha) // JSP: a common path |
294: { |
295: for (i = iBegin; i < iEnd; i++) |
296: { |
297: tempx = -b_data[i]; |
298: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
299: { |
300: tempx += A_data[jj] * x_data[A_j[jj]]; |
301: } |
302: y_data[i] = tempx; |
303: } |
304: } // y = A*x - y |
305: else if (-1 == alpha) // JSP: a common path |
306: { |
307: for (i = iBegin; i < iEnd; i++) |
308: { |
309: tempx = b_data[i]; |
310: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
311: { |
312: tempx -= A_data[jj] * x_data[A_j[jj]]; |
313: } |
314: y_data[i] = tempx; |
315: } |
316: } // y = -A*x + y |
317: else |
318: { |
319: for (i = iBegin; i < iEnd; i++) |
320: { |
321: tempx = -b_data[i]; |
322: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
323: { |
324: tempx += A_data[jj] * x_data[A_j[jj]]; |
325: } |
326: y_data[i] = alpha*tempx; |
327: } |
328: } // y = alpha*(A*x - y) |
329: } // temp == -1 |
330: else if (1 == temp) |
331: { |
332: if (1 == alpha) // JSP: a common path |
333: { |
334: for (i = iBegin; i < iEnd; i++) |
335: { |
336: tempx = b_data[i]; |
337: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
338: { |
339: tempx += A_data[jj] * x_data[A_j[jj]]; |
340: } |
341: y_data[i] = tempx; |
342: } |
343: } // y = A*x + y |
344: else if (-1 == alpha) |
345: { |
346: for (i = iBegin; i < iEnd; i++) |
347: { |
348: tempx = -b_data[i]; |
349: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
350: { |
351: tempx -= A_data[jj] * x_data[A_j[jj]]; |
352: } |
353: y_data[i] = tempx; |
354: } |
355: } // y = -A*x - y |
356: else |
357: { |
358: for (i = iBegin; i < iEnd; i++) |
359: { |
360: tempx = b_data[i]; |
361: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
362: { |
363: tempx += A_data[jj] * x_data[A_j[jj]]; |
364: } |
365: y_data[i] = alpha*tempx; |
[...] |
371: if (1 == alpha) // JSP: a common path |
372: { |
373: for (i = iBegin; i < iEnd; i++) |
374: { |
375: tempx = b_data[i]*temp; |
376: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
377: { |
378: tempx += A_data[jj] * x_data[A_j[jj]]; |
379: } |
380: y_data[i] = tempx; |
381: } |
382: } // y = A*x + temp*y |
383: else if (-1 == alpha) |
384: { |
385: for (i = iBegin; i < iEnd; i++) |
386: { |
387: tempx = -b_data[i]*temp; |
388: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
389: { |
390: tempx -= A_data[jj] * x_data[A_j[jj]]; |
391: } |
392: y_data[i] = tempx; |
393: } |
394: } // y = -A*x - temp*y |
395: else |
396: { |
397: for (i = iBegin; i < iEnd; i++) |
398: { |
399: tempx = b_data[i]*temp; |
400: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
401: { |
402: tempx += A_data[jj] * x_data[A_j[jj]]; |
403: } |
404: y_data[i] = alpha*tempx; |
0x4c7180 PUSH %RBP |
0x4c7181 MOV %RSP,%RBP |
0x4c7184 PUSH %R15 |
0x4c7186 PUSH %R14 |
0x4c7188 PUSH %R13 |
0x4c718a PUSH %R12 |
0x4c718c PUSH %RBX |
0x4c718d SUB $0x38,%RSP |
0x4c7191 MOV %R9,-0x30(%RBP) |
0x4c7195 MOV %R8,-0x58(%RBP) |
0x4c7199 MOV %RCX,%R15 |
0x4c719c MOV %RDX,%R13 |
0x4c719f MOV %RCX,%RDI |
0x4c71a2 CALL 4c5bc0 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> |
0x4c71a7 MOV %RAX,%RBX |
0x4c71aa MOV %R15,%RDI |
0x4c71ad CALL 4c5c40 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> |
0x4c71b2 MOV %RAX,%R14 |
0x4c71b5 CMP %RAX,%RBX |
0x4c71b8 JLE 4c71e8 |
0x4c71ba MOV 0x5aa3f(%RIP),%RDI |
0x4c71c1 MOV $0x4fa05a,%ESI |
0x4c71c6 MOV $0x4fc003,%EDX |
0x4c71cb XOR %EAX,%EAX |
0x4c71cd CALL 4cf9e0 <hypre_fprintf> |
0x4c71d2 MOV $0x4fc999,%EDI |
0x4c71d7 MOV $0xf8,%ESI |
0x4c71dc MOV $0x1,%EDX |
0x4c71e1 XOR %ECX,%ECX |
0x4c71e3 CALL 4d2330 <hypre_error_handler> |
0x4c71e8 MOV 0x18(%RBP),%R12 |
0x4c71ec TEST %RBX,%RBX |
0x4c71ef JS 4c71f6 |
0x4c71f1 CMP %R12,%RBX |
0x4c71f4 JLE 4c7224 |
0x4c71f6 MOV 0x5aa03(%RIP),%RDI |
0x4c71fd MOV $0x4fa05a,%ESI |
0x4c7202 MOV $0x4fca1c,%EDX |
0x4c7207 XOR %EAX,%EAX |
0x4c7209 CALL 4cf9e0 <hypre_fprintf> |
0x4c720e MOV $0x4fc999,%EDI |
0x4c7213 MOV $0xf9,%ESI |
0x4c7218 MOV $0x1,%EDX |
0x4c721d XOR %ECX,%ECX |
0x4c721f CALL 4d2330 <hypre_error_handler> |
0x4c7224 VMOVSD 0x38(%RBP),%XMM4 |
0x4c7229 TEST %R14,%R14 |
0x4c722c JS 4c7233 |
0x4c722e CMP %R12,%R14 |
0x4c7231 JLE 4c7266 |
0x4c7233 MOV 0x5a9c6(%RIP),%RDI |
0x4c723a MOV $0x4fa05a,%ESI |
0x4c723f MOV $0x4fca3e,%EDX |
0x4c7244 XOR %EAX,%EAX |
0x4c7246 CALL 4cf9e0 <hypre_fprintf> |
0x4c724b MOV $0x4fc999,%EDI |
0x4c7250 MOV $0xfa,%ESI |
0x4c7255 MOV $0x1,%EDX |
0x4c725a XOR %ECX,%ECX |
0x4c725c CALL 4d2330 <hypre_error_handler> |
0x4c7261 VMOVSD 0x38(%RBP),%XMM4 |
0x4c7266 MOV 0x30(%RBP),%RSI |
0x4c726a VMOVQ %R13,%XMM0 |
0x4c726f VXORPD %XMM1,%XMM1,%XMM1 |
0x4c7273 VUCOMISD %XMM1,%XMM4 |
0x4c7277 MOV %RBX,-0x50(%RBP) |
0x4c727b JNE 4c73ad |
0x4c7281 VUCOMISD 0x20d87(%RIP),%XMM0 |
0x4c7289 JNE 4c750e |
0x4c728f CMP %R14,%RBX |
0x4c7292 JGE 4c813e |
0x4c7298 MOV -0x30(%RBP),%RAX |
0x4c729c MOV (%RAX),%RDX |
0x4c729f MOV (%RSI),%RSI |
0x4c72a2 MOV %RBX,%RAX |
0x4c72a5 NOT %RAX |
0x4c72a8 ADD %RAX,%R14 |
0x4c72ab XOR %EDI,%EDI |
0x4c72ad MOV %R14,-0x30(%RBP) |
0x4c72b1 MOV %RDX,-0x48(%RBP) |
0x4c72b5 MOV %RSI,-0x40(%RBP) |
0x4c72b9 JMP 4c72d6 |
0x4c72bb NOPL (%RAX,%RAX,1) |
(3811) 0x4c72c0 VMOVSD %XMM0,(%RSI,%R8,8) |
(3811) 0x4c72c6 LEA 0x1(%RDI),%RAX |
(3811) 0x4c72ca CMP %R14,%RDI |
(3811) 0x4c72cd MOV %RAX,%RDI |
(3811) 0x4c72d0 JE 4c813e |
(3811) 0x4c72d6 LEA (%RBX,%RDI,1),%R8 |
(3811) 0x4c72da MOV (%RDX,%R8,8),%R15 |
(3811) 0x4c72de MOV 0x8(%RDX,%R8,8),%R9 |
(3811) 0x4c72e3 VXORPD %XMM0,%XMM0,%XMM0 |
(3811) 0x4c72e7 MOV %R9,%RCX |
(3811) 0x4c72ea SUB %R15,%RCX |
(3811) 0x4c72ed JLE 4c72c0 |
(3811) 0x4c72ef MOV -0x58(%RBP),%RAX |
(3811) 0x4c72f3 MOV (%RAX),%R10 |
(3811) 0x4c72f6 MOV 0x20(%RBP),%RAX |
(3811) 0x4c72fa MOV (%RAX),%R11 |
(3811) 0x4c72fd MOV 0x10(%RBP),%RAX |
(3811) 0x4c7301 MOV (%RAX),%R12 |
(3811) 0x4c7304 MOV %RCX,%R13 |
(3811) 0x4c7307 AND $-0x2,%R13 |
(3811) 0x4c730b JE 4c737c |
(3811) 0x4c730d LEA -0x1(%R13),%RBX |
(3811) 0x4c7311 LEA (%R10,%R15,8),%R14 |
(3811) 0x4c7315 MOV %R15,-0x38(%RBP) |
(3811) 0x4c7319 LEA (%R12,%R15,8),%R15 |
(3811) 0x4c731d VXORPD %XMM0,%XMM0,%XMM0 |
(3811) 0x4c7321 XOR %ESI,%ESI |
(3811) 0x4c7323 NOPW %CS:(%RAX,%RAX,1) |
(3813) 0x4c7330 MOV (%R15,%RSI,8),%RDX |
(3813) 0x4c7334 MOV 0x8(%R15,%RSI,8),%RAX |
(3813) 0x4c7339 VMOVSD (%R11,%RDX,8),%XMM1 |
(3813) 0x4c733f VMOVHPD (%R11,%RAX,8),%XMM1,%XMM1 |
(3813) 0x4c7345 VFMADD231PD (%R14,%RSI,8),%XMM1,%XMM0 |
(3813) 0x4c734b ADD $0x2,%RSI |
(3813) 0x4c734f CMP %RBX,%RSI |
(3813) 0x4c7352 JBE 4c7330 |
(3811) 0x4c7354 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(3811) 0x4c7359 VADDSD %XMM1,%XMM0,%XMM0 |
(3811) 0x4c735d CMP %R13,%RCX |
(3811) 0x4c7360 MOV -0x50(%RBP),%RBX |
(3811) 0x4c7364 MOV -0x30(%RBP),%R14 |
(3811) 0x4c7368 MOV -0x48(%RBP),%RDX |
(3811) 0x4c736c MOV -0x40(%RBP),%RSI |
(3811) 0x4c7370 MOV -0x38(%RBP),%R15 |
(3811) 0x4c7374 JE 4c72c0 |
(3811) 0x4c737a JMP 4c737f |
(3811) 0x4c737c XOR %R13D,%R13D |
(3811) 0x4c737f ADD %R15,%R13 |
(3811) 0x4c7382 NOPW %CS:(%RAX,%RAX,1) |
(3812) 0x4c7390 MOV (%R12,%R13,8),%RAX |
(3812) 0x4c7394 VMOVSD (%R11,%RAX,8),%XMM1 |
(3812) 0x4c739a VFMADD231SD (%R10,%R13,8),%XMM1,%XMM0 |
(3812) 0x4c73a0 INC %R13 |
(3812) 0x4c73a3 CMP %R13,%R9 |
(3812) 0x4c73a6 JNE 4c7390 |
(3811) 0x4c73a8 JMP 4c72c0 |
0x4c73ad MOV 0x28(%RBP),%RDI |
0x4c73b1 VUCOMISD 0x21b67(%RIP),%XMM4 |
0x4c73b9 JNE 4c763d |
0x4c73bf VUCOMISD 0x20c49(%RIP),%XMM0 |
0x4c73c7 JNE 4c778e |
0x4c73cd CMP %R14,%RBX |
0x4c73d0 JGE 4c813e |
0x4c73d6 MOV -0x30(%RBP),%RAX |
0x4c73da MOV (%RAX),%R15 |
0x4c73dd MOV (%RSI),%RSI |
0x4c73e0 MOV %RBX,%RAX |
0x4c73e3 NOT %RAX |
0x4c73e6 ADD %RAX,%R14 |
0x4c73e9 XOR %R8D,%R8D |
0x4c73ec VMOVDDUP 0x23294(%RIP),%XMM0 |
0x4c73f4 MOV %R14,-0x30(%RBP) |
0x4c73f8 MOV %R15,-0x48(%RBP) |
0x4c73fc MOV %RSI,-0x40(%RBP) |
0x4c7400 JMP 4c7426 |
0x4c7402 NOPW %CS:(%RAX,%RAX,1) |
(3802) 0x4c7410 VMOVSD %XMM1,(%RSI,%R9,8) |
(3802) 0x4c7416 LEA 0x1(%R8),%RAX |
(3802) 0x4c741a CMP %R14,%R8 |
(3802) 0x4c741d MOV %RAX,%R8 |
(3802) 0x4c7420 JE 4c813e |
(3802) 0x4c7426 LEA (%RBX,%R8,1),%R9 |
(3802) 0x4c742a VMOVSD (%RDI,%R9,8),%XMM1 |
(3802) 0x4c7430 VXORPD %XMM0,%XMM1,%XMM1 |
(3802) 0x4c7434 MOV (%R15,%R9,8),%RAX |
(3802) 0x4c7438 MOV 0x8(%R15,%R9,8),%R10 |
(3802) 0x4c743d MOV %R10,%RCX |
(3802) 0x4c7440 SUB %RAX,%RCX |
(3802) 0x4c7443 JLE 4c7410 |
(3802) 0x4c7445 MOV %RAX,-0x38(%RBP) |
(3802) 0x4c7449 MOV -0x58(%RBP),%RAX |
(3802) 0x4c744d MOV (%RAX),%R11 |
(3802) 0x4c7450 MOV 0x20(%RBP),%RAX |
(3802) 0x4c7454 MOV (%RAX),%R12 |
(3802) 0x4c7457 MOV 0x10(%RBP),%RAX |
(3802) 0x4c745b MOV (%RAX),%R13 |
(3802) 0x4c745e MOV %RCX,%RDX |
(3802) 0x4c7461 AND $-0x2,%RDX |
(3802) 0x4c7465 JE 4c74e0 |
(3802) 0x4c7467 LEA -0x1(%RDX),%RBX |
(3802) 0x4c746b MOV -0x38(%RBP),%RAX |
(3802) 0x4c746f LEA (%R11,%RAX,8),%R14 |
(3802) 0x4c7473 LEA (,%RAX,8),%R15 |
(3802) 0x4c747b ADD %R13,%R15 |
(3802) 0x4c747e VXORPD %XMM2,%XMM2,%XMM2 |
(3802) 0x4c7482 XOR %ESI,%ESI |
(3802) 0x4c7484 NOPW %CS:(%RAX,%RAX,1) |
(3804) 0x4c7490 MOV (%R15,%RSI,8),%RDI |
(3804) 0x4c7494 MOV 0x8(%R15,%RSI,8),%RAX |
(3804) 0x4c7499 VMOVSD (%R12,%RDI,8),%XMM3 |
(3804) 0x4c749f VMOVHPD (%R12,%RAX,8),%XMM3,%XMM3 |
(3804) 0x4c74a5 VFMADD231PD (%R14,%RSI,8),%XMM3,%XMM2 |
(3804) 0x4c74ab ADD $0x2,%RSI |
(3804) 0x4c74af CMP %RBX,%RSI |
(3804) 0x4c74b2 JBE 4c7490 |
(3802) 0x4c74b4 VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(3802) 0x4c74b9 VADDSD %XMM3,%XMM2,%XMM2 |
(3802) 0x4c74bd VADDSD %XMM2,%XMM1,%XMM1 |
(3802) 0x4c74c1 CMP %RDX,%RCX |
(3802) 0x4c74c4 MOV -0x50(%RBP),%RBX |
(3802) 0x4c74c8 MOV -0x30(%RBP),%R14 |
(3802) 0x4c74cc MOV 0x28(%RBP),%RDI |
(3802) 0x4c74d0 MOV -0x48(%RBP),%R15 |
(3802) 0x4c74d4 MOV -0x40(%RBP),%RSI |
(3802) 0x4c74d8 JE 4c7410 |
(3802) 0x4c74de JMP 4c74e2 |
(3802) 0x4c74e0 XOR %EDX,%EDX |
(3802) 0x4c74e2 ADD -0x38(%RBP),%RDX |
(3802) 0x4c74e6 NOPW %CS:(%RAX,%RAX,1) |
(3803) 0x4c74f0 MOV (%R13,%RDX,8),%RAX |
(3803) 0x4c74f5 VMOVSD (%R12,%RAX,8),%XMM2 |
(3803) 0x4c74fb VFMADD231SD (%R11,%RDX,8),%XMM2,%XMM1 |
(3803) 0x4c7501 INC %RDX |
(3803) 0x4c7504 CMP %RDX,%R10 |
(3803) 0x4c7507 JNE 4c74f0 |
(3802) 0x4c7509 JMP 4c7410 |
0x4c750e VUCOMISD 0x21a0a(%RIP),%XMM0 |
0x4c7516 JNE 4c78ce |
0x4c751c CMP %R14,%RBX |
0x4c751f JGE 4c813e |
0x4c7525 MOV -0x30(%RBP),%RAX |
0x4c7529 MOV (%RAX),%RDX |
0x4c752c MOV (%RSI),%RSI |
0x4c752f MOV %RBX,%RAX |
0x4c7532 NOT %RAX |
0x4c7535 ADD %RAX,%R14 |
0x4c7538 XOR %EDI,%EDI |
0x4c753a MOV %R14,-0x30(%RBP) |
0x4c753e MOV %RDX,-0x48(%RBP) |
0x4c7542 MOV %RSI,-0x40(%RBP) |
0x4c7546 JMP 4c7566 |
0x4c7548 NOPL (%RAX,%RAX,1) |
(3808) 0x4c7550 VMOVSD %XMM0,(%RSI,%R8,8) |
(3808) 0x4c7556 LEA 0x1(%RDI),%RAX |
(3808) 0x4c755a CMP %R14,%RDI |
(3808) 0x4c755d MOV %RAX,%RDI |
(3808) 0x4c7560 JE 4c813e |
(3808) 0x4c7566 LEA (%RBX,%RDI,1),%R8 |
(3808) 0x4c756a MOV (%RDX,%R8,8),%R15 |
(3808) 0x4c756e MOV 0x8(%RDX,%R8,8),%R9 |
(3808) 0x4c7573 VXORPD %XMM0,%XMM0,%XMM0 |
(3808) 0x4c7577 MOV %R9,%RCX |
(3808) 0x4c757a SUB %R15,%RCX |
(3808) 0x4c757d JLE 4c7550 |
(3808) 0x4c757f MOV -0x58(%RBP),%RAX |
(3808) 0x4c7583 MOV (%RAX),%R10 |
(3808) 0x4c7586 MOV 0x20(%RBP),%RAX |
(3808) 0x4c758a MOV (%RAX),%R11 |
(3808) 0x4c758d MOV 0x10(%RBP),%RAX |
(3808) 0x4c7591 MOV (%RAX),%R12 |
(3808) 0x4c7594 MOV %RCX,%R13 |
(3808) 0x4c7597 AND $-0x2,%R13 |
(3808) 0x4c759b JE 4c760c |
(3808) 0x4c759d LEA -0x1(%R13),%RBX |
(3808) 0x4c75a1 LEA (%R10,%R15,8),%R14 |
(3808) 0x4c75a5 MOV %R15,-0x38(%RBP) |
(3808) 0x4c75a9 LEA (%R12,%R15,8),%R15 |
(3808) 0x4c75ad VXORPD %XMM0,%XMM0,%XMM0 |
(3808) 0x4c75b1 XOR %ESI,%ESI |
(3808) 0x4c75b3 NOPW %CS:(%RAX,%RAX,1) |
(3810) 0x4c75c0 MOV (%R15,%RSI,8),%RDX |
(3810) 0x4c75c4 MOV 0x8(%R15,%RSI,8),%RAX |
(3810) 0x4c75c9 VMOVSD (%R11,%RDX,8),%XMM1 |
(3810) 0x4c75cf VMOVHPD (%R11,%RAX,8),%XMM1,%XMM1 |
(3810) 0x4c75d5 VFNMADD231PD (%R14,%RSI,8),%XMM1,%XMM0 |
(3810) 0x4c75db ADD $0x2,%RSI |
(3810) 0x4c75df CMP %RBX,%RSI |
(3810) 0x4c75e2 JBE 4c75c0 |
(3808) 0x4c75e4 VSHUFPD $0x1,%XMM0,%XMM0,%XMM1 |
(3808) 0x4c75e9 VADDSD %XMM1,%XMM0,%XMM0 |
(3808) 0x4c75ed CMP %R13,%RCX |
(3808) 0x4c75f0 MOV -0x50(%RBP),%RBX |
(3808) 0x4c75f4 MOV -0x30(%RBP),%R14 |
(3808) 0x4c75f8 MOV -0x48(%RBP),%RDX |
(3808) 0x4c75fc MOV -0x40(%RBP),%RSI |
(3808) 0x4c7600 MOV -0x38(%RBP),%R15 |
(3808) 0x4c7604 JE 4c7550 |
(3808) 0x4c760a JMP 4c760f |
(3808) 0x4c760c XOR %R13D,%R13D |
(3808) 0x4c760f ADD %R15,%R13 |
(3808) 0x4c7612 NOPW %CS:(%RAX,%RAX,1) |
(3809) 0x4c7620 MOV (%R12,%R13,8),%RAX |
(3809) 0x4c7624 VMOVSD (%R11,%RAX,8),%XMM1 |
(3809) 0x4c762a VFNMADD231SD (%R10,%R13,8),%XMM1,%XMM0 |
(3809) 0x4c7630 INC %R13 |
(3809) 0x4c7633 CMP %R13,%R9 |
(3809) 0x4c7636 JNE 4c7620 |
(3808) 0x4c7638 JMP 4c7550 |
0x4c763d VUCOMISD 0x209cb(%RIP),%XMM4 |
0x4c7645 JNE 4c79ed |
0x4c764b VUCOMISD 0x209bd(%RIP),%XMM0 |
0x4c7653 JNE 4c7b2e |
0x4c7659 CMP %R14,%RBX |
0x4c765c JGE 4c813e |
0x4c7662 MOV -0x30(%RBP),%RAX |
0x4c7666 MOV (%RAX),%R15 |
0x4c7669 MOV (%RSI),%RSI |
0x4c766c MOV %RBX,%RAX |
0x4c766f NOT %RAX |
0x4c7672 ADD %RAX,%R14 |
0x4c7675 XOR %R8D,%R8D |
0x4c7678 MOV %R14,-0x30(%RBP) |
0x4c767c MOV %R15,-0x48(%RBP) |
0x4c7680 MOV %RSI,-0x40(%RBP) |
0x4c7684 JMP 4c76a6 |
0x4c7686 NOPW %CS:(%RAX,%RAX,1) |
(3793) 0x4c7690 VMOVSD %XMM0,(%RSI,%R9,8) |
(3793) 0x4c7696 LEA 0x1(%R8),%RAX |
(3793) 0x4c769a CMP %R14,%R8 |
(3793) 0x4c769d MOV %RAX,%R8 |
(3793) 0x4c76a0 JE 4c813e |
(3793) 0x4c76a6 LEA (%RBX,%R8,1),%R9 |
(3793) 0x4c76aa VMOVSD (%RDI,%R9,8),%XMM0 |
(3793) 0x4c76b0 MOV (%R15,%R9,8),%RAX |
(3793) 0x4c76b4 MOV 0x8(%R15,%R9,8),%R10 |
(3793) 0x4c76b9 MOV %R10,%RCX |
(3793) 0x4c76bc SUB %RAX,%RCX |
(3793) 0x4c76bf JLE 4c7690 |
(3793) 0x4c76c1 MOV %RAX,-0x38(%RBP) |
(3793) 0x4c76c5 MOV -0x58(%RBP),%RAX |
(3793) 0x4c76c9 MOV (%RAX),%R11 |
(3793) 0x4c76cc MOV 0x20(%RBP),%RAX |
(3793) 0x4c76d0 MOV (%RAX),%R12 |
(3793) 0x4c76d3 MOV 0x10(%RBP),%RAX |
(3793) 0x4c76d7 MOV (%RAX),%R13 |
(3793) 0x4c76da MOV %RCX,%RDX |
(3793) 0x4c76dd AND $-0x2,%RDX |
(3793) 0x4c76e1 JE 4c7760 |
(3793) 0x4c76e3 LEA -0x1(%RDX),%RBX |
(3793) 0x4c76e7 MOV -0x38(%RBP),%RAX |
(3793) 0x4c76eb LEA (%R11,%RAX,8),%RSI |
(3793) 0x4c76ef LEA (,%RAX,8),%R14 |
(3793) 0x4c76f7 ADD %R13,%R14 |
(3793) 0x4c76fa VXORPD %XMM1,%XMM1,%XMM1 |
(3793) 0x4c76fe XOR %R15D,%R15D |
(3793) 0x4c7701 NOPW %CS:(%RAX,%RAX,1) |
(3795) 0x4c7710 MOV (%R14,%R15,8),%RDI |
(3795) 0x4c7714 MOV 0x8(%R14,%R15,8),%RAX |
(3795) 0x4c7719 VMOVSD (%R12,%RDI,8),%XMM2 |
(3795) 0x4c771f VMOVHPD (%R12,%RAX,8),%XMM2,%XMM2 |
(3795) 0x4c7725 VFMADD231PD (%RSI,%R15,8),%XMM2,%XMM1 |
(3795) 0x4c772b ADD $0x2,%R15 |
(3795) 0x4c772f CMP %RBX,%R15 |
(3795) 0x4c7732 JBE 4c7710 |
(3793) 0x4c7734 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(3793) 0x4c7739 VADDSD %XMM2,%XMM1,%XMM1 |
(3793) 0x4c773d VADDSD %XMM1,%XMM0,%XMM0 |
(3793) 0x4c7741 CMP %RDX,%RCX |
(3793) 0x4c7744 MOV -0x50(%RBP),%RBX |
(3793) 0x4c7748 MOV -0x30(%RBP),%R14 |
(3793) 0x4c774c MOV 0x28(%RBP),%RDI |
(3793) 0x4c7750 MOV -0x48(%RBP),%R15 |
(3793) 0x4c7754 MOV -0x40(%RBP),%RSI |
(3793) 0x4c7758 JE 4c7690 |
(3793) 0x4c775e JMP 4c7762 |
(3793) 0x4c7760 XOR %EDX,%EDX |
(3793) 0x4c7762 ADD -0x38(%RBP),%RDX |
(3793) 0x4c7766 NOPW %CS:(%RAX,%RAX,1) |
(3794) 0x4c7770 MOV (%R13,%RDX,8),%RAX |
(3794) 0x4c7775 VMOVSD (%R12,%RAX,8),%XMM1 |
(3794) 0x4c777b VFMADD231SD (%R11,%RDX,8),%XMM1,%XMM0 |
(3794) 0x4c7781 INC %RDX |
(3794) 0x4c7784 CMP %RDX,%R10 |
(3794) 0x4c7787 JNE 4c7770 |
(3793) 0x4c7789 JMP 4c7690 |
0x4c778e VUCOMISD 0x2178a(%RIP),%XMM0 |
0x4c7796 JNE 4c7c7e |
0x4c779c CMP %R14,%RBX |
0x4c779f JGE 4c813e |
0x4c77a5 MOV -0x30(%RBP),%RAX |
0x4c77a9 MOV (%RAX),%R15 |
0x4c77ac MOV (%RSI),%RSI |
0x4c77af MOV %RBX,%RAX |
0x4c77b2 NOT %RAX |
0x4c77b5 ADD %RAX,%R14 |
0x4c77b8 XOR %R8D,%R8D |
0x4c77bb MOV %R14,-0x30(%RBP) |
0x4c77bf MOV %R15,-0x48(%RBP) |
0x4c77c3 MOV %RSI,-0x40(%RBP) |
0x4c77c7 JMP 4c77e6 |
0x4c77c9 NOPL (%RAX) |
(3799) 0x4c77d0 VMOVSD %XMM0,(%RSI,%R9,8) |
(3799) 0x4c77d6 LEA 0x1(%R8),%RAX |
(3799) 0x4c77da CMP %R14,%R8 |
(3799) 0x4c77dd MOV %RAX,%R8 |
(3799) 0x4c77e0 JE 4c813e |
(3799) 0x4c77e6 LEA (%RBX,%R8,1),%R9 |
(3799) 0x4c77ea VMOVSD (%RDI,%R9,8),%XMM0 |
(3799) 0x4c77f0 MOV (%R15,%R9,8),%RAX |
(3799) 0x4c77f4 MOV 0x8(%R15,%R9,8),%R10 |
(3799) 0x4c77f9 MOV %R10,%RCX |
(3799) 0x4c77fc SUB %RAX,%RCX |
(3799) 0x4c77ff JLE 4c77d0 |
(3799) 0x4c7801 MOV %RAX,-0x38(%RBP) |
(3799) 0x4c7805 MOV -0x58(%RBP),%RAX |
(3799) 0x4c7809 MOV (%RAX),%R11 |
(3799) 0x4c780c MOV 0x20(%RBP),%RAX |
(3799) 0x4c7810 MOV (%RAX),%R12 |
(3799) 0x4c7813 MOV 0x10(%RBP),%RAX |
(3799) 0x4c7817 MOV (%RAX),%R13 |
(3799) 0x4c781a MOV %RCX,%RDX |
(3799) 0x4c781d AND $-0x2,%RDX |
(3799) 0x4c7821 JE 4c78a0 |
(3799) 0x4c7823 LEA -0x1(%RDX),%RBX |
(3799) 0x4c7827 MOV -0x38(%RBP),%RAX |
(3799) 0x4c782b LEA (%R11,%RAX,8),%RSI |
(3799) 0x4c782f LEA (,%RAX,8),%R14 |
(3799) 0x4c7837 ADD %R13,%R14 |
(3799) 0x4c783a VXORPD %XMM1,%XMM1,%XMM1 |
(3799) 0x4c783e XOR %R15D,%R15D |
(3799) 0x4c7841 NOPW %CS:(%RAX,%RAX,1) |
(3801) 0x4c7850 MOV (%R14,%R15,8),%RDI |
(3801) 0x4c7854 MOV 0x8(%R14,%R15,8),%RAX |
(3801) 0x4c7859 VMOVSD (%R12,%RDI,8),%XMM2 |
(3801) 0x4c785f VMOVHPD (%R12,%RAX,8),%XMM2,%XMM2 |
(3801) 0x4c7865 VFNMADD231PD (%RSI,%R15,8),%XMM2,%XMM1 |
(3801) 0x4c786b ADD $0x2,%R15 |
(3801) 0x4c786f CMP %RBX,%R15 |
(3801) 0x4c7872 JBE 4c7850 |
(3799) 0x4c7874 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(3799) 0x4c7879 VADDSD %XMM2,%XMM1,%XMM1 |
(3799) 0x4c787d VADDSD %XMM1,%XMM0,%XMM0 |
(3799) 0x4c7881 CMP %RDX,%RCX |
(3799) 0x4c7884 MOV -0x50(%RBP),%RBX |
(3799) 0x4c7888 MOV -0x30(%RBP),%R14 |
(3799) 0x4c788c MOV 0x28(%RBP),%RDI |
(3799) 0x4c7890 MOV -0x48(%RBP),%R15 |
(3799) 0x4c7894 MOV -0x40(%RBP),%RSI |
(3799) 0x4c7898 JE 4c77d0 |
(3799) 0x4c789e JMP 4c78a2 |
(3799) 0x4c78a0 XOR %EDX,%EDX |
(3799) 0x4c78a2 ADD -0x38(%RBP),%RDX |
(3799) 0x4c78a6 NOPW %CS:(%RAX,%RAX,1) |
(3800) 0x4c78b0 MOV (%R13,%RDX,8),%RAX |
(3800) 0x4c78b5 VMOVSD (%R12,%RAX,8),%XMM1 |
(3800) 0x4c78bb VFNMADD231SD (%R11,%RDX,8),%XMM1,%XMM0 |
(3800) 0x4c78c1 INC %RDX |
(3800) 0x4c78c4 CMP %RDX,%R10 |
(3800) 0x4c78c7 JNE 4c78b0 |
(3799) 0x4c78c9 JMP 4c77d0 |
0x4c78ce CMP %R14,%RBX |
0x4c78d1 JGE 4c813e |
0x4c78d7 MOV -0x30(%RBP),%RAX |
0x4c78db MOV (%RAX),%RDX |
0x4c78de MOV (%RSI),%RSI |
0x4c78e1 MOV %RBX,%RAX |
0x4c78e4 NOT %RAX |
0x4c78e7 ADD %RAX,%R14 |
0x4c78ea XOR %EDI,%EDI |
0x4c78ec MOV %R14,-0x30(%RBP) |
0x4c78f0 MOV %RDX,-0x48(%RBP) |
0x4c78f4 MOV %RSI,-0x40(%RBP) |
0x4c78f8 JMP 4c791a |
0x4c78fa NOPW (%RAX,%RAX,1) |
(3805) 0x4c7900 VMULSD %XMM0,%XMM1,%XMM1 |
(3805) 0x4c7904 VMOVSD %XMM1,(%RSI,%R8,8) |
(3805) 0x4c790a LEA 0x1(%RDI),%RAX |
(3805) 0x4c790e CMP %R14,%RDI |
(3805) 0x4c7911 MOV %RAX,%RDI |
(3805) 0x4c7914 JE 4c813e |
(3805) 0x4c791a LEA (%RBX,%RDI,1),%R8 |
(3805) 0x4c791e MOV (%RDX,%R8,8),%R15 |
(3805) 0x4c7922 MOV 0x8(%RDX,%R8,8),%R9 |
(3805) 0x4c7927 VXORPD %XMM1,%XMM1,%XMM1 |
(3805) 0x4c792b MOV %R9,%RCX |
(3805) 0x4c792e SUB %R15,%RCX |
(3805) 0x4c7931 JLE 4c7900 |
(3805) 0x4c7933 MOV -0x58(%RBP),%RAX |
(3805) 0x4c7937 MOV (%RAX),%R10 |
(3805) 0x4c793a MOV 0x20(%RBP),%RAX |
(3805) 0x4c793e MOV (%RAX),%R11 |
(3805) 0x4c7941 MOV 0x10(%RBP),%RAX |
(3805) 0x4c7945 MOV (%RAX),%R12 |
(3805) 0x4c7948 MOV %RCX,%R13 |
(3805) 0x4c794b AND $-0x2,%R13 |
(3805) 0x4c794f JE 4c79bc |
(3805) 0x4c7951 LEA -0x1(%R13),%RBX |
(3805) 0x4c7955 LEA (%R10,%R15,8),%R14 |
(3805) 0x4c7959 MOV %R15,-0x38(%RBP) |
(3805) 0x4c795d LEA (%R12,%R15,8),%R15 |
(3805) 0x4c7961 VXORPD %XMM1,%XMM1,%XMM1 |
(3805) 0x4c7965 XOR %ESI,%ESI |
(3805) 0x4c7967 NOPW (%RAX,%RAX,1) |
(3807) 0x4c7970 MOV (%R15,%RSI,8),%RDX |
(3807) 0x4c7974 MOV 0x8(%R15,%RSI,8),%RAX |
(3807) 0x4c7979 VMOVSD (%R11,%RDX,8),%XMM2 |
(3807) 0x4c797f VMOVHPD (%R11,%RAX,8),%XMM2,%XMM2 |
(3807) 0x4c7985 VFMADD231PD (%R14,%RSI,8),%XMM2,%XMM1 |
(3807) 0x4c798b ADD $0x2,%RSI |
(3807) 0x4c798f CMP %RBX,%RSI |
(3807) 0x4c7992 JBE 4c7970 |
(3805) 0x4c7994 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(3805) 0x4c7999 VADDSD %XMM2,%XMM1,%XMM1 |
(3805) 0x4c799d CMP %R13,%RCX |
(3805) 0x4c79a0 MOV -0x50(%RBP),%RBX |
(3805) 0x4c79a4 MOV -0x30(%RBP),%R14 |
(3805) 0x4c79a8 MOV -0x48(%RBP),%RDX |
(3805) 0x4c79ac MOV -0x40(%RBP),%RSI |
(3805) 0x4c79b0 MOV -0x38(%RBP),%R15 |
(3805) 0x4c79b4 JE 4c7900 |
(3805) 0x4c79ba JMP 4c79bf |
(3805) 0x4c79bc XOR %R13D,%R13D |
(3805) 0x4c79bf ADD %R15,%R13 |
(3805) 0x4c79c2 NOPW %CS:(%RAX,%RAX,1) |
(3806) 0x4c79d0 MOV (%R12,%R13,8),%RAX |
(3806) 0x4c79d4 VMOVSD (%R11,%RAX,8),%XMM2 |
(3806) 0x4c79da VFMADD231SD (%R10,%R13,8),%XMM2,%XMM1 |
(3806) 0x4c79e0 INC %R13 |
(3806) 0x4c79e3 CMP %R13,%R9 |
(3806) 0x4c79e6 JNE 4c79d0 |
(3805) 0x4c79e8 JMP 4c7900 |
0x4c79ed VUCOMISD 0x2061b(%RIP),%XMM0 |
0x4c79f5 JNE 4c7dbe |
0x4c79fb CMP %R14,%RBX |
0x4c79fe JGE 4c813e |
0x4c7a04 MOV -0x30(%RBP),%RAX |
0x4c7a08 MOV (%RAX),%R15 |
0x4c7a0b MOV (%RSI),%RSI |
0x4c7a0e MOV %RBX,%RAX |
0x4c7a11 NOT %RAX |
0x4c7a14 ADD %RAX,%R14 |
0x4c7a17 XOR %R8D,%R8D |
0x4c7a1a MOV %R14,-0x30(%RBP) |
0x4c7a1e MOV %R15,-0x48(%RBP) |
0x4c7a22 MOV %RSI,-0x40(%RBP) |
0x4c7a26 JMP 4c7a46 |
0x4c7a28 NOPL (%RAX,%RAX,1) |
(3784) 0x4c7a30 VMOVSD %XMM0,(%RSI,%R9,8) |
(3784) 0x4c7a36 LEA 0x1(%R8),%RAX |
(3784) 0x4c7a3a CMP %R14,%R8 |
(3784) 0x4c7a3d MOV %RAX,%R8 |
(3784) 0x4c7a40 JE 4c813e |
(3784) 0x4c7a46 LEA (%RBX,%R8,1),%R9 |
(3784) 0x4c7a4a VMULSD (%RDI,%R9,8),%XMM4,%XMM0 |
(3784) 0x4c7a50 MOV (%R15,%R9,8),%RAX |
(3784) 0x4c7a54 MOV 0x8(%R15,%R9,8),%R10 |
(3784) 0x4c7a59 MOV %R10,%RCX |
(3784) 0x4c7a5c SUB %RAX,%RCX |
(3784) 0x4c7a5f JLE 4c7a30 |
(3784) 0x4c7a61 MOV %RAX,-0x38(%RBP) |
(3784) 0x4c7a65 MOV -0x58(%RBP),%RAX |
(3784) 0x4c7a69 MOV (%RAX),%R11 |
(3784) 0x4c7a6c MOV 0x20(%RBP),%RAX |
(3784) 0x4c7a70 MOV (%RAX),%R12 |
(3784) 0x4c7a73 MOV 0x10(%RBP),%RAX |
(3784) 0x4c7a77 MOV (%RAX),%R13 |
(3784) 0x4c7a7a MOV %RCX,%RDX |
(3784) 0x4c7a7d AND $-0x2,%RDX |
(3784) 0x4c7a81 JE 4c7b00 |
(3784) 0x4c7a83 LEA -0x1(%RDX),%RSI |
(3784) 0x4c7a87 MOV -0x38(%RBP),%RAX |
(3784) 0x4c7a8b LEA (%R11,%RAX,8),%RBX |
(3784) 0x4c7a8f LEA (,%RAX,8),%R14 |
(3784) 0x4c7a97 ADD %R13,%R14 |
(3784) 0x4c7a9a VXORPD %XMM1,%XMM1,%XMM1 |
(3784) 0x4c7a9e XOR %R15D,%R15D |
(3784) 0x4c7aa1 NOPW %CS:(%RAX,%RAX,1) |
(3786) 0x4c7ab0 MOV (%R14,%R15,8),%RDI |
(3786) 0x4c7ab4 MOV 0x8(%R14,%R15,8),%RAX |
(3786) 0x4c7ab9 VMOVSD (%R12,%RDI,8),%XMM2 |
(3786) 0x4c7abf VMOVHPD (%R12,%RAX,8),%XMM2,%XMM2 |
(3786) 0x4c7ac5 VFMADD231PD (%RBX,%R15,8),%XMM2,%XMM1 |
(3786) 0x4c7acb ADD $0x2,%R15 |
(3786) 0x4c7acf CMP %RSI,%R15 |
(3786) 0x4c7ad2 JBE 4c7ab0 |
(3784) 0x4c7ad4 VSHUFPD $0x1,%XMM1,%XMM1,%XMM2 |
(3784) 0x4c7ad9 VADDSD %XMM2,%XMM1,%XMM1 |
(3784) 0x4c7add VADDSD %XMM1,%XMM0,%XMM0 |
(3784) 0x4c7ae1 CMP %RDX,%RCX |
(3784) 0x4c7ae4 MOV -0x50(%RBP),%RBX |
(3784) 0x4c7ae8 MOV -0x30(%RBP),%R14 |
(3784) 0x4c7aec MOV 0x28(%RBP),%RDI |
(3784) 0x4c7af0 MOV -0x48(%RBP),%R15 |
(3784) 0x4c7af4 MOV -0x40(%RBP),%RSI |
(3784) 0x4c7af8 JE 4c7a30 |
(3784) 0x4c7afe JMP 4c7b02 |
(3784) 0x4c7b00 XOR %EDX,%EDX |
(3784) 0x4c7b02 ADD -0x38(%RBP),%RDX |
(3784) 0x4c7b06 NOPW %CS:(%RAX,%RAX,1) |
(3785) 0x4c7b10 MOV (%R13,%RDX,8),%RAX |
(3785) 0x4c7b15 VMOVSD (%R12,%RAX,8),%XMM1 |
(3785) 0x4c7b1b VFMADD231SD (%R11,%RDX,8),%XMM1,%XMM0 |
(3785) 0x4c7b21 INC %RDX |
(3785) 0x4c7b24 CMP %RDX,%R10 |
(3785) 0x4c7b27 JNE 4c7b10 |
(3784) 0x4c7b29 JMP 4c7a30 |
0x4c7b2e VUCOMISD 0x213ea(%RIP),%XMM0 |
0x4c7b36 JNE 4c7efe |
0x4c7b3c CMP %R14,%RBX |
0x4c7b3f JGE 4c813e |
0x4c7b45 MOV -0x30(%RBP),%RAX |
0x4c7b49 MOV (%RAX),%R15 |
0x4c7b4c MOV (%RSI),%RSI |
0x4c7b4f MOV %RBX,%RAX |
0x4c7b52 NOT %RAX |
0x4c7b55 ADD %RAX,%R14 |
0x4c7b58 XOR %R8D,%R8D |
0x4c7b5b VMOVDDUP 0x22b25(%RIP),%XMM0 |
0x4c7b63 MOV %R14,-0x30(%RBP) |
0x4c7b67 MOV %R15,-0x48(%RBP) |
0x4c7b6b MOV %RSI,-0x40(%RBP) |
0x4c7b6f JMP 4c7b96 |
0x4c7b71 NOPW %CS:(%RAX,%RAX,1) |
(3790) 0x4c7b80 VMOVSD %XMM1,(%RSI,%R9,8) |
(3790) 0x4c7b86 LEA 0x1(%R8),%RAX |
(3790) 0x4c7b8a CMP %R14,%R8 |
(3790) 0x4c7b8d MOV %RAX,%R8 |
(3790) 0x4c7b90 JE 4c813e |
(3790) 0x4c7b96 LEA (%RBX,%R8,1),%R9 |
(3790) 0x4c7b9a VMOVSD (%RDI,%R9,8),%XMM1 |
(3790) 0x4c7ba0 VXORPD %XMM0,%XMM1,%XMM1 |
(3790) 0x4c7ba4 MOV (%R15,%R9,8),%RAX |
(3790) 0x4c7ba8 MOV 0x8(%R15,%R9,8),%R10 |
(3790) 0x4c7bad MOV %R10,%RCX |
(3790) 0x4c7bb0 SUB %RAX,%RCX |
(3790) 0x4c7bb3 JLE 4c7b80 |
(3790) 0x4c7bb5 MOV %RAX,-0x38(%RBP) |
(3790) 0x4c7bb9 MOV -0x58(%RBP),%RAX |
(3790) 0x4c7bbd MOV (%RAX),%R11 |
(3790) 0x4c7bc0 MOV 0x20(%RBP),%RAX |
(3790) 0x4c7bc4 MOV (%RAX),%R12 |
(3790) 0x4c7bc7 MOV 0x10(%RBP),%RAX |
(3790) 0x4c7bcb MOV (%RAX),%R13 |
(3790) 0x4c7bce MOV %RCX,%RDX |
(3790) 0x4c7bd1 AND $-0x2,%RDX |
(3790) 0x4c7bd5 JE 4c7c50 |
(3790) 0x4c7bd7 LEA -0x1(%RDX),%RSI |
(3790) 0x4c7bdb MOV -0x38(%RBP),%RAX |
(3790) 0x4c7bdf LEA (%R11,%RAX,8),%RBX |
(3790) 0x4c7be3 LEA (,%RAX,8),%R14 |
(3790) 0x4c7beb ADD %R13,%R14 |
(3790) 0x4c7bee VXORPD %XMM2,%XMM2,%XMM2 |
(3790) 0x4c7bf2 XOR %R15D,%R15D |
(3790) 0x4c7bf5 NOPW %CS:(%RAX,%RAX,1) |
(3792) 0x4c7c00 MOV (%R14,%R15,8),%RDI |
(3792) 0x4c7c04 MOV 0x8(%R14,%R15,8),%RAX |
(3792) 0x4c7c09 VMOVSD (%R12,%RDI,8),%XMM3 |
(3792) 0x4c7c0f VMOVHPD (%R12,%RAX,8),%XMM3,%XMM3 |
(3792) 0x4c7c15 VFNMADD231PD (%RBX,%R15,8),%XMM3,%XMM2 |
(3792) 0x4c7c1b ADD $0x2,%R15 |
(3792) 0x4c7c1f CMP %RSI,%R15 |
(3792) 0x4c7c22 JBE 4c7c00 |
(3790) 0x4c7c24 VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(3790) 0x4c7c29 VADDSD %XMM3,%XMM2,%XMM2 |
(3790) 0x4c7c2d VADDSD %XMM2,%XMM1,%XMM1 |
(3790) 0x4c7c31 CMP %RDX,%RCX |
(3790) 0x4c7c34 MOV -0x50(%RBP),%RBX |
(3790) 0x4c7c38 MOV -0x30(%RBP),%R14 |
(3790) 0x4c7c3c MOV 0x28(%RBP),%RDI |
(3790) 0x4c7c40 MOV -0x48(%RBP),%R15 |
(3790) 0x4c7c44 MOV -0x40(%RBP),%RSI |
(3790) 0x4c7c48 JE 4c7b80 |
(3790) 0x4c7c4e JMP 4c7c52 |
(3790) 0x4c7c50 XOR %EDX,%EDX |
(3790) 0x4c7c52 ADD -0x38(%RBP),%RDX |
(3790) 0x4c7c56 NOPW %CS:(%RAX,%RAX,1) |
(3791) 0x4c7c60 MOV (%R13,%RDX,8),%RAX |
(3791) 0x4c7c65 VMOVSD (%R12,%RAX,8),%XMM2 |
(3791) 0x4c7c6b VFNMADD231SD (%R11,%RDX,8),%XMM2,%XMM1 |
(3791) 0x4c7c71 INC %RDX |
(3791) 0x4c7c74 CMP %RDX,%R10 |
(3791) 0x4c7c77 JNE 4c7c60 |
(3790) 0x4c7c79 JMP 4c7b80 |
0x4c7c7e CMP %R14,%RBX |
0x4c7c81 JGE 4c813e |
0x4c7c87 MOV -0x30(%RBP),%RAX |
0x4c7c8b MOV (%RAX),%R15 |
0x4c7c8e MOV (%RSI),%RSI |
0x4c7c91 MOV %RBX,%RAX |
0x4c7c94 NOT %RAX |
0x4c7c97 ADD %RAX,%R14 |
0x4c7c9a XOR %R8D,%R8D |
0x4c7c9d VMOVDDUP 0x229e3(%RIP),%XMM1 |
0x4c7ca5 MOV %R14,-0x30(%RBP) |
0x4c7ca9 MOV %R15,-0x48(%RBP) |
0x4c7cad MOV %RSI,-0x40(%RBP) |
0x4c7cb1 JMP 4c7cda |
0x4c7cb3 NOPW %CS:(%RAX,%RAX,1) |
(3796) 0x4c7cc0 VMULSD %XMM0,%XMM2,%XMM2 |
(3796) 0x4c7cc4 VMOVSD %XMM2,(%RSI,%R9,8) |
(3796) 0x4c7cca LEA 0x1(%R8),%RAX |
(3796) 0x4c7cce CMP %R14,%R8 |
(3796) 0x4c7cd1 MOV %RAX,%R8 |
(3796) 0x4c7cd4 JE 4c813e |
(3796) 0x4c7cda LEA (%RBX,%R8,1),%R9 |
(3796) 0x4c7cde VMOVSD (%RDI,%R9,8),%XMM2 |
(3796) 0x4c7ce4 VXORPD %XMM1,%XMM2,%XMM2 |
(3796) 0x4c7ce8 MOV (%R15,%R9,8),%RAX |
(3796) 0x4c7cec MOV 0x8(%R15,%R9,8),%R10 |
(3796) 0x4c7cf1 MOV %R10,%RCX |
(3796) 0x4c7cf4 SUB %RAX,%RCX |
(3796) 0x4c7cf7 JLE 4c7cc0 |
(3796) 0x4c7cf9 MOV %RAX,-0x38(%RBP) |
(3796) 0x4c7cfd MOV -0x58(%RBP),%RAX |
(3796) 0x4c7d01 MOV (%RAX),%R11 |
(3796) 0x4c7d04 MOV 0x20(%RBP),%RAX |
(3796) 0x4c7d08 MOV (%RAX),%R12 |
(3796) 0x4c7d0b MOV 0x10(%RBP),%RAX |
(3796) 0x4c7d0f MOV (%RAX),%R13 |
(3796) 0x4c7d12 MOV %RCX,%RDX |
(3796) 0x4c7d15 AND $-0x2,%RDX |
(3796) 0x4c7d19 JE 4c7d90 |
(3796) 0x4c7d1b LEA -0x1(%RDX),%RBX |
(3796) 0x4c7d1f MOV -0x38(%RBP),%RAX |
(3796) 0x4c7d23 LEA (%R11,%RAX,8),%RSI |
(3796) 0x4c7d27 LEA (,%RAX,8),%R14 |
(3796) 0x4c7d2f ADD %R13,%R14 |
(3796) 0x4c7d32 VXORPD %XMM3,%XMM3,%XMM3 |
(3796) 0x4c7d36 XOR %R15D,%R15D |
(3796) 0x4c7d39 NOPL (%RAX) |
(3798) 0x4c7d40 MOV (%R14,%R15,8),%RDI |
(3798) 0x4c7d44 MOV 0x8(%R14,%R15,8),%RAX |
(3798) 0x4c7d49 VMOVSD (%R12,%RDI,8),%XMM4 |
(3798) 0x4c7d4f VMOVHPD (%R12,%RAX,8),%XMM4,%XMM4 |
(3798) 0x4c7d55 VFMADD231PD (%RSI,%R15,8),%XMM4,%XMM3 |
(3798) 0x4c7d5b ADD $0x2,%R15 |
(3798) 0x4c7d5f CMP %RBX,%R15 |
(3798) 0x4c7d62 JBE 4c7d40 |
(3796) 0x4c7d64 VSHUFPD $0x1,%XMM3,%XMM3,%XMM4 |
(3796) 0x4c7d69 VADDSD %XMM4,%XMM3,%XMM3 |
(3796) 0x4c7d6d VADDSD %XMM3,%XMM2,%XMM2 |
(3796) 0x4c7d71 CMP %RDX,%RCX |
(3796) 0x4c7d74 MOV -0x50(%RBP),%RBX |
(3796) 0x4c7d78 MOV -0x30(%RBP),%R14 |
(3796) 0x4c7d7c MOV 0x28(%RBP),%RDI |
(3796) 0x4c7d80 MOV -0x48(%RBP),%R15 |
(3796) 0x4c7d84 MOV -0x40(%RBP),%RSI |
(3796) 0x4c7d88 JE 4c7cc0 |
(3796) 0x4c7d8e JMP 4c7d92 |
(3796) 0x4c7d90 XOR %EDX,%EDX |
(3796) 0x4c7d92 ADD -0x38(%RBP),%RDX |
(3796) 0x4c7d96 NOPW %CS:(%RAX,%RAX,1) |
(3797) 0x4c7da0 MOV (%R13,%RDX,8),%RAX |
(3797) 0x4c7da5 VMOVSD (%R12,%RAX,8),%XMM3 |
(3797) 0x4c7dab VFMADD231SD (%R11,%RDX,8),%XMM3,%XMM2 |
(3797) 0x4c7db1 INC %RDX |
(3797) 0x4c7db4 CMP %RDX,%R10 |
(3797) 0x4c7db7 JNE 4c7da0 |
(3796) 0x4c7db9 JMP 4c7cc0 |
0x4c7dbe VUCOMISD 0x2115a(%RIP),%XMM0 |
0x4c7dc6 JNE 4c801e |
0x4c7dcc CMP %R14,%RBX |
0x4c7dcf JGE 4c813e |
0x4c7dd5 VXORPD 0x20ef3(%RIP),%XMM4,%XMM0 |
0x4c7ddd MOV -0x30(%RBP),%RAX |
0x4c7de1 MOV (%RAX),%RDX |
0x4c7de4 MOV (%RSI),%R15 |
0x4c7de7 MOV %RBX,%RAX |
0x4c7dea NOT %RAX |
0x4c7ded ADD %RAX,%R14 |
0x4c7df0 XOR %R8D,%R8D |
0x4c7df3 MOV %R14,-0x30(%RBP) |
0x4c7df7 MOV %RDX,-0x48(%RBP) |
0x4c7dfb MOV %R15,-0x40(%RBP) |
0x4c7dff JMP 4c7e17 |
(3781) 0x4c7e01 VMOVSD %XMM1,(%R15,%R9,8) |
(3781) 0x4c7e07 LEA 0x1(%R8),%RAX |
(3781) 0x4c7e0b CMP %R14,%R8 |
(3781) 0x4c7e0e MOV %RAX,%R8 |
(3781) 0x4c7e11 JE 4c813e |
(3781) 0x4c7e17 LEA (%RBX,%R8,1),%R9 |
(3781) 0x4c7e1b VMULSD (%RDI,%R9,8),%XMM0,%XMM1 |
(3781) 0x4c7e21 MOV (%RDX,%R9,8),%RAX |
(3781) 0x4c7e25 MOV 0x8(%RDX,%R9,8),%R10 |
(3781) 0x4c7e2a MOV %R10,%RCX |
(3781) 0x4c7e2d SUB %RAX,%RCX |
(3781) 0x4c7e30 JLE 4c7e01 |
(3781) 0x4c7e32 MOV %RAX,-0x38(%RBP) |
(3781) 0x4c7e36 MOV -0x58(%RBP),%RAX |
(3781) 0x4c7e3a MOV (%RAX),%R11 |
(3781) 0x4c7e3d MOV 0x20(%RBP),%RAX |
(3781) 0x4c7e41 MOV (%RAX),%R12 |
(3781) 0x4c7e44 MOV 0x10(%RBP),%RAX |
(3781) 0x4c7e48 MOV (%RAX),%R13 |
(3781) 0x4c7e4b MOV %RCX,%RSI |
(3781) 0x4c7e4e AND $-0x2,%RSI |
(3781) 0x4c7e52 JE 4c7ed0 |
(3781) 0x4c7e54 LEA -0x1(%RSI),%RDX |
(3781) 0x4c7e58 MOV -0x38(%RBP),%RAX |
(3781) 0x4c7e5c LEA (%R11,%RAX,8),%RBX |
(3781) 0x4c7e60 LEA (,%RAX,8),%R14 |
(3781) 0x4c7e68 ADD %R13,%R14 |
(3781) 0x4c7e6b VXORPD %XMM2,%XMM2,%XMM2 |
(3781) 0x4c7e6f XOR %R15D,%R15D |
(3781) 0x4c7e72 NOPW %CS:(%RAX,%RAX,1) |
(3783) 0x4c7e80 MOV (%R14,%R15,8),%RDI |
(3783) 0x4c7e84 MOV 0x8(%R14,%R15,8),%RAX |
(3783) 0x4c7e89 VMOVSD (%R12,%RDI,8),%XMM3 |
(3783) 0x4c7e8f VMOVHPD (%R12,%RAX,8),%XMM3,%XMM3 |
(3783) 0x4c7e95 VFNMADD231PD (%RBX,%R15,8),%XMM3,%XMM2 |
(3783) 0x4c7e9b ADD $0x2,%R15 |
(3783) 0x4c7e9f CMP %RDX,%R15 |
(3783) 0x4c7ea2 JBE 4c7e80 |
(3781) 0x4c7ea4 VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(3781) 0x4c7ea9 VADDSD %XMM3,%XMM2,%XMM2 |
(3781) 0x4c7ead VADDSD %XMM2,%XMM1,%XMM1 |
(3781) 0x4c7eb1 CMP %RSI,%RCX |
(3781) 0x4c7eb4 MOV -0x50(%RBP),%RBX |
(3781) 0x4c7eb8 MOV -0x30(%RBP),%R14 |
(3781) 0x4c7ebc MOV 0x28(%RBP),%RDI |
(3781) 0x4c7ec0 MOV -0x48(%RBP),%RDX |
(3781) 0x4c7ec4 MOV -0x40(%RBP),%R15 |
(3781) 0x4c7ec8 JE 4c7e01 |
(3781) 0x4c7ece JMP 4c7ed2 |
(3781) 0x4c7ed0 XOR %ESI,%ESI |
(3781) 0x4c7ed2 ADD -0x38(%RBP),%RSI |
(3781) 0x4c7ed6 NOPW %CS:(%RAX,%RAX,1) |
(3782) 0x4c7ee0 MOV (%R13,%RSI,8),%RAX |
(3782) 0x4c7ee5 VMOVSD (%R12,%RAX,8),%XMM2 |
(3782) 0x4c7eeb VFNMADD231SD (%R11,%RSI,8),%XMM2,%XMM1 |
(3782) 0x4c7ef1 INC %RSI |
(3782) 0x4c7ef4 CMP %RSI,%R10 |
(3782) 0x4c7ef7 JNE 4c7ee0 |
(3781) 0x4c7ef9 JMP 4c7e01 |
0x4c7efe CMP %R14,%RBX |
0x4c7f01 JGE 4c813e |
0x4c7f07 MOV -0x30(%RBP),%RAX |
0x4c7f0b MOV (%RAX),%R15 |
0x4c7f0e MOV (%RSI),%RSI |
0x4c7f11 MOV %RBX,%RAX |
0x4c7f14 NOT %RAX |
0x4c7f17 ADD %RAX,%R14 |
0x4c7f1a XOR %R8D,%R8D |
0x4c7f1d MOV %R14,-0x30(%RBP) |
0x4c7f21 MOV %R15,-0x48(%RBP) |
0x4c7f25 MOV %RSI,-0x40(%RBP) |
0x4c7f29 JMP 4c7f45 |
(3787) 0x4c7f2b VMULSD %XMM0,%XMM1,%XMM1 |
(3787) 0x4c7f2f VMOVSD %XMM1,(%RSI,%R9,8) |
(3787) 0x4c7f35 LEA 0x1(%R8),%RAX |
(3787) 0x4c7f39 CMP %R14,%R8 |
(3787) 0x4c7f3c MOV %RAX,%R8 |
(3787) 0x4c7f3f JE 4c813e |
(3787) 0x4c7f45 LEA (%RBX,%R8,1),%R9 |
(3787) 0x4c7f49 VMOVSD (%RDI,%R9,8),%XMM1 |
(3787) 0x4c7f4f MOV (%R15,%R9,8),%RAX |
(3787) 0x4c7f53 MOV 0x8(%R15,%R9,8),%R10 |
(3787) 0x4c7f58 MOV %R10,%RCX |
(3787) 0x4c7f5b SUB %RAX,%RCX |
(3787) 0x4c7f5e JLE 4c7f2b |
(3787) 0x4c7f60 MOV %RAX,-0x38(%RBP) |
(3787) 0x4c7f64 MOV -0x58(%RBP),%RAX |
(3787) 0x4c7f68 MOV (%RAX),%R11 |
(3787) 0x4c7f6b MOV 0x20(%RBP),%RAX |
(3787) 0x4c7f6f MOV (%RAX),%R12 |
(3787) 0x4c7f72 MOV 0x10(%RBP),%RAX |
(3787) 0x4c7f76 MOV (%RAX),%R13 |
(3787) 0x4c7f79 MOV %RCX,%RDX |
(3787) 0x4c7f7c AND $-0x2,%RDX |
(3787) 0x4c7f80 JE 4c7ff0 |
(3787) 0x4c7f82 LEA -0x1(%RDX),%RSI |
(3787) 0x4c7f86 MOV -0x38(%RBP),%RAX |
(3787) 0x4c7f8a LEA (%R11,%RAX,8),%RBX |
(3787) 0x4c7f8e LEA (,%RAX,8),%R14 |
(3787) 0x4c7f96 ADD %R13,%R14 |
(3787) 0x4c7f99 VXORPD %XMM2,%XMM2,%XMM2 |
(3787) 0x4c7f9d XOR %R15D,%R15D |
(3789) 0x4c7fa0 MOV (%R14,%R15,8),%RDI |
(3789) 0x4c7fa4 MOV 0x8(%R14,%R15,8),%RAX |
(3789) 0x4c7fa9 VMOVSD (%R12,%RDI,8),%XMM3 |
(3789) 0x4c7faf VMOVHPD (%R12,%RAX,8),%XMM3,%XMM3 |
(3789) 0x4c7fb5 VFMADD231PD (%RBX,%R15,8),%XMM3,%XMM2 |
(3789) 0x4c7fbb ADD $0x2,%R15 |
(3789) 0x4c7fbf CMP %RSI,%R15 |
(3789) 0x4c7fc2 JBE 4c7fa0 |
(3787) 0x4c7fc4 VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(3787) 0x4c7fc9 VADDSD %XMM3,%XMM2,%XMM2 |
(3787) 0x4c7fcd VADDSD %XMM2,%XMM1,%XMM1 |
(3787) 0x4c7fd1 CMP %RDX,%RCX |
(3787) 0x4c7fd4 MOV -0x50(%RBP),%RBX |
(3787) 0x4c7fd8 MOV -0x30(%RBP),%R14 |
(3787) 0x4c7fdc MOV 0x28(%RBP),%RDI |
(3787) 0x4c7fe0 MOV -0x48(%RBP),%R15 |
(3787) 0x4c7fe4 MOV -0x40(%RBP),%RSI |
(3787) 0x4c7fe8 JE 4c7f2b |
(3787) 0x4c7fee JMP 4c7ff2 |
(3787) 0x4c7ff0 XOR %EDX,%EDX |
(3787) 0x4c7ff2 ADD -0x38(%RBP),%RDX |
(3787) 0x4c7ff6 NOPW %CS:(%RAX,%RAX,1) |
(3788) 0x4c8000 MOV (%R13,%RDX,8),%RAX |
(3788) 0x4c8005 VMOVSD (%R12,%RAX,8),%XMM2 |
(3788) 0x4c800b VFMADD231SD (%R11,%RDX,8),%XMM2,%XMM1 |
(3788) 0x4c8011 INC %RDX |
(3788) 0x4c8014 CMP %RDX,%R10 |
(3788) 0x4c8017 JNE 4c8000 |
(3787) 0x4c8019 JMP 4c7f2b |
0x4c801e CMP %R14,%RBX |
0x4c8021 JGE 4c813e |
0x4c8027 MOV -0x30(%RBP),%RAX |
0x4c802b MOV (%RAX),%RDX |
0x4c802e MOV (%RSI),%R15 |
0x4c8031 MOV %RBX,%RAX |
0x4c8034 NOT %RAX |
0x4c8037 ADD %RAX,%R14 |
0x4c803a XOR %R8D,%R8D |
0x4c803d MOV %R14,-0x30(%RBP) |
0x4c8041 MOV %RDX,-0x48(%RBP) |
0x4c8045 MOV %R15,-0x40(%RBP) |
0x4c8049 JMP 4c8065 |
(3778) 0x4c804b VMULSD %XMM0,%XMM1,%XMM1 |
(3778) 0x4c804f VMOVSD %XMM1,(%R15,%R9,8) |
(3778) 0x4c8055 LEA 0x1(%R8),%RAX |
(3778) 0x4c8059 CMP %R14,%R8 |
(3778) 0x4c805c MOV %RAX,%R8 |
(3778) 0x4c805f JE 4c813e |
(3778) 0x4c8065 LEA (%RBX,%R8,1),%R9 |
(3778) 0x4c8069 VMULSD (%RDI,%R9,8),%XMM4,%XMM1 |
(3778) 0x4c806f MOV (%RDX,%R9,8),%RAX |
(3778) 0x4c8073 MOV 0x8(%RDX,%R9,8),%R10 |
(3778) 0x4c8078 MOV %R10,%RCX |
(3778) 0x4c807b SUB %RAX,%RCX |
(3778) 0x4c807e JLE 4c804b |
(3778) 0x4c8080 MOV %RAX,-0x38(%RBP) |
(3778) 0x4c8084 MOV -0x58(%RBP),%RAX |
(3778) 0x4c8088 MOV (%RAX),%R11 |
(3778) 0x4c808b MOV 0x20(%RBP),%RAX |
(3778) 0x4c808f MOV (%RAX),%R12 |
(3778) 0x4c8092 MOV 0x10(%RBP),%RAX |
(3778) 0x4c8096 MOV (%RAX),%R13 |
(3778) 0x4c8099 MOV %RCX,%RSI |
(3778) 0x4c809c AND $-0x2,%RSI |
(3778) 0x4c80a0 JE 4c8110 |
(3778) 0x4c80a2 LEA -0x1(%RSI),%RDX |
(3778) 0x4c80a6 MOV -0x38(%RBP),%RAX |
(3778) 0x4c80aa LEA (%R11,%RAX,8),%RBX |
(3778) 0x4c80ae LEA (,%RAX,8),%R14 |
(3778) 0x4c80b6 ADD %R13,%R14 |
(3778) 0x4c80b9 VXORPD %XMM2,%XMM2,%XMM2 |
(3778) 0x4c80bd XOR %R15D,%R15D |
(3780) 0x4c80c0 MOV (%R14,%R15,8),%RDI |
(3780) 0x4c80c4 MOV 0x8(%R14,%R15,8),%RAX |
(3780) 0x4c80c9 VMOVSD (%R12,%RDI,8),%XMM3 |
(3780) 0x4c80cf VMOVHPD (%R12,%RAX,8),%XMM3,%XMM3 |
(3780) 0x4c80d5 VFMADD231PD (%RBX,%R15,8),%XMM3,%XMM2 |
(3780) 0x4c80db ADD $0x2,%R15 |
(3780) 0x4c80df CMP %RDX,%R15 |
(3780) 0x4c80e2 JBE 4c80c0 |
(3778) 0x4c80e4 VSHUFPD $0x1,%XMM2,%XMM2,%XMM3 |
(3778) 0x4c80e9 VADDSD %XMM3,%XMM2,%XMM2 |
(3778) 0x4c80ed VADDSD %XMM2,%XMM1,%XMM1 |
(3778) 0x4c80f1 CMP %RSI,%RCX |
(3778) 0x4c80f4 MOV -0x50(%RBP),%RBX |
(3778) 0x4c80f8 MOV -0x30(%RBP),%R14 |
(3778) 0x4c80fc MOV 0x28(%RBP),%RDI |
(3778) 0x4c8100 MOV -0x48(%RBP),%RDX |
(3778) 0x4c8104 MOV -0x40(%RBP),%R15 |
(3778) 0x4c8108 JE 4c804b |
(3778) 0x4c810e JMP 4c8112 |
(3778) 0x4c8110 XOR %ESI,%ESI |
(3778) 0x4c8112 ADD -0x38(%RBP),%RSI |
(3778) 0x4c8116 NOPW %CS:(%RAX,%RAX,1) |
(3779) 0x4c8120 MOV (%R13,%RSI,8),%RAX |
(3779) 0x4c8125 VMOVSD (%R12,%RAX,8),%XMM2 |
(3779) 0x4c812b VFMADD231SD (%R11,%RSI,8),%XMM2,%XMM1 |
(3779) 0x4c8131 INC %RSI |
(3779) 0x4c8134 CMP %RSI,%R10 |
(3779) 0x4c8137 JNE 4c8120 |
(3778) 0x4c8139 JMP 4c804b |
0x4c813e ADD $0x38,%RSP |
0x4c8142 POP %RBX |
0x4c8143 POP %R12 |
0x4c8145 POP %R13 |
0x4c8147 POP %R14 |
0x4c8149 POP %R15 |
0x4c814b POP %RBP |
0x4c814c RET |
0x4c814d NOPL (%RAX) |
Path / |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 266 |
nb uops | 284 |
loop length | 1074 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 9 |
micro-operation queue | 47.33 cycles |
front end | 47.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 19.40 | 21.67 | 21.67 | 26.50 | 19.40 | 20.00 | 26.50 | 26.50 | 26.50 | 19.20 | 21.67 |
cycles | 20.00 | 19.40 | 21.67 | 21.67 | 26.50 | 19.40 | 20.00 | 26.50 | 26.50 | 26.50 | 19.20 | 21.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 46.33 |
Stall cycles | 0.00 |
Front-end | 47.33 |
Dispatch | 26.50 |
Overall L1 | 47.33 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 1% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 3% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x38,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4c5bc0 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4c5c40 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RAX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c71e8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x68> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x5aa3f(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4fa05a,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4fc003,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4cf9e0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4fc999,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d2330 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c71f6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x76> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R12,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c7224 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x5aa03(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4fa05a,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4fca1c,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4cf9e0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4fc999,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d2330 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c7233 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R12,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c7266 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x5a9c6(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4fa05a,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4fca3e,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4cf9e0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4fc999,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d2330 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM4 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RBX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4c73ad <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x22d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x20d87(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c750e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x38e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c72d6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x156> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x28(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x21b67(%RIP),%XMM4 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c763d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4bd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x20c49(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c778e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x60e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x23294(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7426 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x2a6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x21a0a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c78ce <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x74e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7566 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x3e6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x209cb(%RIP),%XMM4 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c79ed <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x86d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x209bd(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c7b2e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x9ae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c76a6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x526> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x2178a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c7c7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xafe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c77e6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x666> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c791a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x79a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x2061b(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c7dbe <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc3e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7a46 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8c6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x213ea(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c7efe <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd7e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x22b25(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7b96 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa16> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x229e3(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7cda <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb5a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x2115a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c801e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe9e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x20ef3(%RIP),%XMM4,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7e17 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc97> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7f45 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdc5> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c8065 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xee5> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x38,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 266 |
nb uops | 284 |
loop length | 1074 |
used x86 registers | 14 |
used mmx registers | 0 |
used xmm registers | 3 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 9 |
micro-operation queue | 47.33 cycles |
front end | 47.33 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 19.40 | 21.67 | 21.67 | 26.50 | 19.40 | 20.00 | 26.50 | 26.50 | 26.50 | 19.20 | 21.67 |
cycles | 20.00 | 19.40 | 21.67 | 21.67 | 26.50 | 19.40 | 20.00 | 26.50 | 26.50 | 26.50 | 19.20 | 21.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 46.33 |
Stall cycles | 0.00 |
Front-end | 47.33 |
Dispatch | 26.50 |
Overall L1 | 47.33 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 0% |
all | 11% |
load | 6% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
all | 1% |
load | 2% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 3% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 9% |
all | 13% |
load | 13% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 14% |
all | 11% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x38,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4c5bc0 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4c5c40 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %RAX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c71e8 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x68> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x5aa3f(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4fa05a,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4fc003,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4cf9e0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4fc999,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d2330 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBP),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RBX,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c71f6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x76> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R12,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c7224 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x5aa03(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4fa05a,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4fca1c,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4cf9e0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4fc999,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf9,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d2330 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JS 4c7233 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb3> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R12,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 4c7266 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe6> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0x5a9c6(%RIP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x4fa05a,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x4fca3e,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4cf9e0 <hypre_fprintf> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV $0x4fc999,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xfa,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 4d2330 <hypre_error_handler> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
VMOVSD 0x38(%RBP),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVQ %R13,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VXORPD %XMM1,%XMM1,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD %XMM1,%XMM4 | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RBX,-0x50(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JNE 4c73ad <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x22d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x20d87(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c750e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x38e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c72d6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x156> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x28(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VUCOMISD 0x21b67(%RIP),%XMM4 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c763d <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x4bd> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x20c49(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c778e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x60e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x23294(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7426 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x2a6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x21a0a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c78ce <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x74e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7566 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x3e6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x209cb(%RIP),%XMM4 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c79ed <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x86d> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VUCOMISD 0x209bd(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c7b2e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x9ae> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c76a6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x526> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x2178a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c7c7e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xafe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c77e6 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x666> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c791a <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x79a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x2061b(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c7dbe <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc3e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7a46 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0x8c6> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x213ea(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c7efe <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xd7e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x22b25(%RIP),%XMM0 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7b96 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xa16> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VMOVDDUP 0x229e3(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7cda <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xb5a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VUCOMISD 0x2115a(%RIP),%XMM0 | 2 | 1 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 1 |
JNE 4c801e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xe9e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
VXORPD 0x20ef3(%RIP),%XMM4,%XMM0 | 1 | 0.33 | 0.33 | 0.33 | 0.33 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0-1 | 0.33 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7e17 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xc97> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c7f45 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xdc5> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
CMP %R14,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c813e <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xfbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x30(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %R8D,%R8D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R14,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R15,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c8065 <hypre_CSRMatrixMatvecOutOfPlace.extracted+0xee5> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD $0x38,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace.extracted– | 18.58 | 7.77 |
▼Loop 3793 - csr_matvec.c:248-341 - exec– | 0.92 | 0.33 |
○Loop 3795 - csr_matvec.c:337-339 - exec | 0.31 | 0.11 |
○Loop 3794 - csr_matvec.c:337-339 - exec | 0.24 | 0.09 |
▼Loop 3799 - csr_matvec.c:248-314 - exec– | 0.49 | 0.17 |
○Loop 3801 - csr_matvec.c:310-312 - exec | 8.42 | 2.99 |
○Loop 3800 - csr_matvec.c:310-312 - exec | 0.17 | 0.06 |
▼Loop 3811 - csr_matvec.c:248-263 - exec– | 0.33 | 0.12 |
○Loop 3813 - csr_matvec.c:259-261 - exec | 7.54 | 2.68 |
○Loop 3812 - csr_matvec.c:259-261 - exec | 0.16 | 0.06 |
▼Loop 3781 - csr_matvec.c:248-392 - exec– | 0 | 0 |
○Loop 3783 - csr_matvec.c:388-390 - exec | 0 | 0 |
○Loop 3782 - csr_matvec.c:388-390 - exec | 0 | 0 |
▼Loop 3790 - csr_matvec.c:248-353 - exec– | 0 | 0 |
○Loop 3791 - csr_matvec.c:349-351 - exec | 0 | 0 |
○Loop 3792 - csr_matvec.c:349-351 - exec | 0 | 0 |
▼Loop 3805 - csr_matvec.c:248-287 - exec– | 0 | 0 |
○Loop 3807 - csr_matvec.c:283-285 - exec | 0 | 0 |
○Loop 3806 - csr_matvec.c:283-285 - exec | 0 | 0 |
▼Loop 3808 - csr_matvec.c:248-275 - exec– | 0 | 0 |
○Loop 3809 - csr_matvec.c:271-273 - exec | 0 | 0 |
○Loop 3810 - csr_matvec.c:271-273 - exec | 0 | 0 |
▼Loop 3787 - csr_matvec.c:248-365 - exec– | 0 | 0 |
○Loop 3789 - csr_matvec.c:361-363 - exec | 0 | 0 |
○Loop 3788 - csr_matvec.c:361-363 - exec | 0 | 0 |
▼Loop 3778 - csr_matvec.c:248-404 - exec– | 0 | 0 |
○Loop 3780 - csr_matvec.c:400-402 - exec | 0 | 0 |
○Loop 3779 - csr_matvec.c:400-402 - exec | 0 | 0 |
▼Loop 3784 - csr_matvec.c:248-380 - exec– | 0 | 0 |
○Loop 3785 - csr_matvec.c:376-378 - exec | 0 | 0 |
○Loop 3786 - csr_matvec.c:376-378 - exec | 0 | 0 |
▼Loop 3796 - csr_matvec.c:248-326 - exec– | 0 | 0 |
○Loop 3797 - csr_matvec.c:322-324 - exec | 0 | 0 |
○Loop 3798 - csr_matvec.c:322-324 - exec | 0 | 0 |
▼Loop 3802 - csr_matvec.c:248-302 - exec– | 0 | 0 |
○Loop 3803 - csr_matvec.c:298-300 - exec | 0 | 0 |
○Loop 3804 - csr_matvec.c:298-300 - exec | 0 | 0 |