Loop Id: 575 | Module: exec | Source: par_multi_interp.c:1072-1125 | Coverage: 0.1% |
---|
Loop Id: 575 | Module: exec | Source: par_multi_interp.c:1072-1125 | Coverage: 0.1% |
---|
0x45ff20 MOV -0xb0(%RBP),%R13 |
0x45ff27 MOV -0x70(%RBP),%RDI |
0x45ff2b MOV -0xd0(%RBP),%R8 |
0x45ff32 MOV (%R13,%RDI,8),%RDI |
0x45ff37 LEA 0x8(,%RDI,8),%R11 |
0x45ff3f MOV (%R8,%RDI,8),%RCX |
0x45ff43 MOV %RDI,%RAX |
0x45ff46 ADD %R11,%R8 |
0x45ff49 NOT %RAX |
0x45ff4c MOV %R8,-0x90(%RBP) |
0x45ff53 MOV (%R8),%R8 |
0x45ff56 MOV %RCX,-0x38(%RBP) |
0x45ff5a CMP %R8,%RCX |
0x45ff5d JGE 460280 |
0x45ff63 MOV %RDI,-0xe0(%RBP) |
0x45ff6a MOV %RBX,%R13 |
0x45ff6d MOV -0x88(%RBP),%RDI |
0x45ff74 MOV %R11,-0xc0(%RBP) |
0x45ff7b JMP 45ff91 |
(578) 0x45ff80 INCQ -0x38(%RBP) |
(578) 0x45ff84 MOV -0x38(%RBP),%RDX |
(578) 0x45ff88 CMP %R8,%RDX |
(578) 0x45ff8b JGE 460268 |
(578) 0x45ff91 MOV -0x38(%RBP),%R11 |
(578) 0x45ff95 MOV -0x40(%RBP),%RDX |
(578) 0x45ff99 MOV -0x48(%RBP),%RBX |
(578) 0x45ff9d MOV (%RDX,%R11,8),%RCX |
(578) 0x45ffa1 LEA (,%RCX,8),%R11 |
(578) 0x45ffa9 CMP %R13,(%RBX,%RCX,8) |
(578) 0x45ffad JNE 45ff80 |
(578) 0x45ffaf MOV -0x80(%RBP),%R8 |
(578) 0x45ffb3 MOV -0x60(%RBP),%RDX |
(578) 0x45ffb7 MOV (%R8,%RCX,8),%R8 |
(578) 0x45ffbb MOV 0x8(%RDX,%R11,1),%RBX |
(578) 0x45ffc0 ADD %R8,%RBX |
(578) 0x45ffc3 CMP %RBX,%R8 |
(578) 0x45ffc6 JGE 460124 |
(578) 0x45ffcc MOV -0x8(%R10,%R14,1),%RDX |
(578) 0x45ffd1 LEA (%RDX,%RBX,8),%RBX |
(578) 0x45ffd5 LEA (%RDX,%R8,8),%R8 |
(578) 0x45ffd9 MOV %RBX,-0x68(%RBP) |
(578) 0x45ffdd SUB %R8,%RBX |
(578) 0x45ffe0 SUB $0x8,%RBX |
(578) 0x45ffe4 SHR $0x3,%RBX |
(578) 0x45ffe8 INC %RBX |
(578) 0x45ffeb AND $0x3,%EBX |
(578) 0x45ffee JE 460097 |
(578) 0x45fff4 CMP $0x1,%RBX |
(578) 0x45fff8 JE 46005e |
(578) 0x45fffa CMP $0x2,%RBX |
(578) 0x45fffe JE 46002f |
(578) 0x460000 MOV (%R8),%RDX |
(578) 0x460003 MOV %RDX,%RBX |
(578) 0x460006 LEA (%R12,%RDX,8),%RDX |
(578) 0x46000a MOV %RDX,-0x88(%RBP) |
(578) 0x460011 CMP %RAX,(%RDX) |
(578) 0x460014 JE 46002b |
(578) 0x460016 MOV (%R10,%R14,1),%RDX |
(578) 0x46001a MOV %RBX,(%RDX,%RSI,8) |
(578) 0x46001e MOV -0x88(%RBP),%RBX |
(578) 0x460025 INC %RSI |
(578) 0x460028 MOV %RAX,(%RBX) |
(578) 0x46002b ADD $0x8,%R8 |
(578) 0x46002f MOV (%R8),%RDX |
(578) 0x460032 MOV %RDX,%RBX |
(578) 0x460035 LEA (%R12,%RDX,8),%RDX |
(578) 0x460039 MOV %RDX,-0x88(%RBP) |
(578) 0x460040 CMP %RAX,(%RDX) |
(578) 0x460043 JE 46005a |
(578) 0x460045 MOV (%R10,%R14,1),%RDX |
(578) 0x460049 MOV %RBX,(%RDX,%RSI,8) |
(578) 0x46004d MOV -0x88(%RBP),%RBX |
(578) 0x460054 INC %RSI |
(578) 0x460057 MOV %RAX,(%RBX) |
(578) 0x46005a ADD $0x8,%R8 |
(578) 0x46005e MOV (%R8),%RDX |
(578) 0x460061 MOV %RDX,%RBX |
(578) 0x460064 LEA (%R12,%RDX,8),%RDX |
(578) 0x460068 MOV %RDX,-0x88(%RBP) |
(578) 0x46006f CMP %RAX,(%RDX) |
(578) 0x460072 JE 460089 |
(578) 0x460074 MOV (%R10,%R14,1),%RDX |
(578) 0x460078 MOV %RBX,(%RDX,%RSI,8) |
(578) 0x46007c MOV -0x88(%RBP),%RBX |
(578) 0x460083 INC %RSI |
(578) 0x460086 MOV %RAX,(%RBX) |
(578) 0x460089 ADD $0x8,%R8 |
(578) 0x46008d CMP %R8,-0x68(%RBP) |
(578) 0x460091 JE 460124 |
(578) 0x460097 MOV %RCX,-0x88(%RBP) |
(578) 0x46009e MOV %RDI,%RBX |
(580) 0x4600a1 MOV (%R8),%RDI |
(580) 0x4600a4 LEA (%R12,%RDI,8),%RDX |
(580) 0x4600a8 CMP %RAX,(%RDX) |
(580) 0x4600ab JE 4600bb |
(580) 0x4600ad MOV (%R10,%R14,1),%RCX |
(580) 0x4600b1 MOV %RDI,(%RCX,%RSI,8) |
(580) 0x4600b5 INC %RSI |
(580) 0x4600b8 MOV %RAX,(%RDX) |
(580) 0x4600bb LEA 0x8(%R8),%RDX |
(580) 0x4600bf MOV 0x8(%R8),%R8 |
(580) 0x4600c3 LEA (%R12,%R8,8),%RDI |
(580) 0x4600c7 CMP %RAX,(%RDI) |
(580) 0x4600ca JE 4600da |
(580) 0x4600cc MOV (%R10,%R14,1),%RCX |
(580) 0x4600d0 MOV %R8,(%RCX,%RSI,8) |
(580) 0x4600d4 INC %RSI |
(580) 0x4600d7 MOV %RAX,(%RDI) |
(580) 0x4600da MOV 0x8(%RDX),%R8 |
(580) 0x4600de LEA (%R12,%R8,8),%RDI |
(580) 0x4600e2 CMP %RAX,(%RDI) |
(580) 0x4600e5 JE 4600f5 |
(580) 0x4600e7 MOV (%R10,%R14,1),%RCX |
(580) 0x4600eb MOV %R8,(%RCX,%RSI,8) |
(580) 0x4600ef INC %RSI |
(580) 0x4600f2 MOV %RAX,(%RDI) |
(580) 0x4600f5 MOV 0x10(%RDX),%R8 |
(580) 0x4600f9 LEA (%R12,%R8,8),%RDI |
(580) 0x4600fd CMP %RAX,(%RDI) |
(580) 0x460100 JE 460110 |
(580) 0x460102 MOV (%R10,%R14,1),%RCX |
(580) 0x460106 MOV %R8,(%RCX,%RSI,8) |
(580) 0x46010a INC %RSI |
(580) 0x46010d MOV %RAX,(%RDI) |
(580) 0x460110 LEA 0x18(%RDX),%R8 |
(580) 0x460114 CMP %R8,-0x68(%RBP) |
(580) 0x460118 JNE 4600a1 |
(578) 0x46011a MOV -0x88(%RBP),%RCX |
(578) 0x460121 MOV %RBX,%RDI |
(578) 0x460124 MOV -0x78(%RBP),%RBX |
(578) 0x460128 MOV -0x58(%RBP),%RDX |
(578) 0x46012c MOV (%RBX,%RCX,8),%RCX |
(578) 0x460130 MOV 0x8(%RDX,%R11,1),%R8 |
(578) 0x460135 ADD %RCX,%R8 |
(578) 0x460138 CMP %R8,%RCX |
(578) 0x46013b JGE 460650 |
(578) 0x460141 MOV -0x8(%R9,%R14,1),%RBX |
(578) 0x460146 LEA (%RBX,%RCX,8),%RCX |
(578) 0x46014a LEA (%RBX,%R8,8),%RBX |
(578) 0x46014e MOV %RBX,%RDX |
(578) 0x460151 SUB %RCX,%RDX |
(578) 0x460154 SUB $0x8,%RDX |
(578) 0x460158 SHR $0x3,%RDX |
(578) 0x46015c INC %RDX |
(578) 0x46015f AND $0x3,%EDX |
(578) 0x460162 JE 4601cf |
(578) 0x460164 CMP $0x1,%RDX |
(578) 0x460168 JE 4601ac |
(578) 0x46016a CMP $0x2,%RDX |
(578) 0x46016e JE 46018e |
(578) 0x460170 MOV (%RCX),%R11 |
(578) 0x460173 LEA (%R15,%R11,8),%R8 |
(578) 0x460177 CMP %RAX,(%R8) |
(578) 0x46017a JE 46018a |
(578) 0x46017c MOV (%R9,%R14,1),%RDX |
(578) 0x460180 MOV %R11,(%RDX,%RDI,8) |
(578) 0x460184 INC %RDI |
(578) 0x460187 MOV %RAX,(%R8) |
(578) 0x46018a ADD $0x8,%RCX |
(578) 0x46018e MOV (%RCX),%R11 |
(578) 0x460191 LEA (%R15,%R11,8),%R8 |
(578) 0x460195 CMP %RAX,(%R8) |
(578) 0x460198 JE 4601a8 |
(578) 0x46019a MOV (%R9,%R14,1),%RDX |
(578) 0x46019e MOV %R11,(%RDX,%RDI,8) |
(578) 0x4601a2 INC %RDI |
(578) 0x4601a5 MOV %RAX,(%R8) |
(578) 0x4601a8 ADD $0x8,%RCX |
(578) 0x4601ac MOV (%RCX),%R11 |
(578) 0x4601af LEA (%R15,%R11,8),%R8 |
(578) 0x4601b3 CMP %RAX,(%R8) |
(578) 0x4601b6 JE 4601c6 |
(578) 0x4601b8 MOV (%R9,%R14,1),%RDX |
(578) 0x4601bc MOV %R11,(%RDX,%RDI,8) |
(578) 0x4601c0 INC %RDI |
(578) 0x4601c3 MOV %RAX,(%R8) |
(578) 0x4601c6 ADD $0x8,%RCX |
(578) 0x4601ca CMP %RBX,%RCX |
(578) 0x4601cd JE 460247 |
(579) 0x4601cf MOV (%RCX),%R8 |
(579) 0x4601d2 LEA (%R15,%R8,8),%RDX |
(579) 0x4601d6 CMP %RAX,(%RDX) |
(579) 0x4601d9 JE 4601e9 |
(579) 0x4601db MOV (%R9,%R14,1),%R11 |
(579) 0x4601df MOV %R8,(%R11,%RDI,8) |
(579) 0x4601e3 INC %RDI |
(579) 0x4601e6 MOV %RAX,(%RDX) |
(579) 0x4601e9 MOV 0x8(%RCX),%R8 |
(579) 0x4601ed LEA 0x8(%RCX),%RDX |
(579) 0x4601f1 LEA (%R15,%R8,8),%RCX |
(579) 0x4601f5 CMP %RAX,(%RCX) |
(579) 0x4601f8 JE 460208 |
(579) 0x4601fa MOV (%R9,%R14,1),%R11 |
(579) 0x4601fe MOV %R8,(%R11,%RDI,8) |
(579) 0x460202 INC %RDI |
(579) 0x460205 MOV %RAX,(%RCX) |
(579) 0x460208 MOV 0x8(%RDX),%R8 |
(579) 0x46020c LEA (%R15,%R8,8),%RCX |
(579) 0x460210 CMP %RAX,(%RCX) |
(579) 0x460213 JE 460223 |
(579) 0x460215 MOV (%R9,%R14,1),%R11 |
(579) 0x460219 MOV %R8,(%R11,%RDI,8) |
(579) 0x46021d INC %RDI |
(579) 0x460220 MOV %RAX,(%RCX) |
(579) 0x460223 MOV 0x10(%RDX),%R8 |
(579) 0x460227 LEA (%R15,%R8,8),%RCX |
(579) 0x46022b CMP %RAX,(%RCX) |
(579) 0x46022e JE 46023e |
(579) 0x460230 MOV (%R9,%R14,1),%R11 |
(579) 0x460234 MOV %R8,(%R11,%RDI,8) |
(579) 0x460238 INC %RDI |
(579) 0x46023b MOV %RAX,(%RCX) |
(579) 0x46023e LEA 0x18(%RDX),%RCX |
(579) 0x460242 CMP %RBX,%RCX |
(579) 0x460245 JNE 4601cf |
(578) 0x460247 MOV -0x90(%RBP),%RBX |
(578) 0x46024e INCQ -0x38(%RBP) |
(578) 0x460252 MOV -0x38(%RBP),%RDX |
(578) 0x460256 MOV (%RBX),%R8 |
(578) 0x460259 CMP %R8,%RDX |
(578) 0x46025c JL 45ff91 |
0x460262 NOPW (%RAX,%RAX,1) |
0x460268 MOV %RDI,-0x88(%RBP) |
0x46026f MOV -0xc0(%RBP),%R11 |
0x460276 MOV %R13,%RBX |
0x460279 MOV -0xe0(%RBP),%RDI |
0x460280 MOV -0xc8(%RBP),%RCX |
0x460287 MOV (%RCX,%RDI,8),%RAX |
0x46028b ADD %R11,%RCX |
0x46028e NOT %RDI |
0x460291 MOV %RCX,-0xc0(%RBP) |
0x460298 MOV (%RCX),%RCX |
0x46029b CMP %RAX,%RCX |
0x46029e JLE 460552 |
0x4602a4 MOV %R9,-0x68(%RBP) |
0x4602a8 MOV -0x88(%RBP),%R8 |
0x4602af MOV %R10,-0x90(%RBP) |
0x4602b6 MOV -0xd8(%RBP),%R13 |
0x4602bd JMP 4602cc |
(576) 0x4602c0 INC %RAX |
(576) 0x4602c3 CMP %RCX,%RAX |
(576) 0x4602c6 JGE 460540 |
(576) 0x4602cc MOV -0x50(%RBP),%R9 |
(576) 0x4602d0 MOV (%R9,%RAX,8),%RDX |
(576) 0x4602d4 LEA (,%RDX,8),%R11 |
(576) 0x4602dc CMP %RBX,(%R13,%RDX,8) |
(576) 0x4602e1 JNE 4602c0 |
(576) 0x4602e3 MOV -0xa0(%RBP),%R10 |
(576) 0x4602ea MOV -0x98(%RBP),%R9 |
(576) 0x4602f1 MOV (%R10,%RDX,8),%RDX |
(576) 0x4602f5 MOV 0x8(%R9,%R11,1),%R11 |
(576) 0x4602fa ADD %RDX,%R11 |
(576) 0x4602fd CMP %R11,%RDX |
(576) 0x460300 JGE 4602c0 |
(576) 0x460302 MOV -0xa8(%RBP),%RCX |
(576) 0x460309 MOV (%RCX,%R14,1),%R10 |
(576) 0x46030d LEA (%R10,%R11,8),%R9 |
(576) 0x460311 LEA (%R10,%RDX,8),%RDX |
(576) 0x460315 MOV %R9,-0x38(%RBP) |
(576) 0x460319 SUB %RDX,%R9 |
(576) 0x46031c SUB $0x8,%R9 |
(576) 0x460320 SHR $0x3,%R9 |
(576) 0x460324 INC %R9 |
(576) 0x460327 AND $0x3,%R9D |
(576) 0x46032b JE 4603c8 |
(576) 0x460331 CMP $0x1,%R9 |
(576) 0x460335 JE 460393 |
(576) 0x460337 CMP $0x2,%R9 |
(576) 0x46033b JE 460368 |
(576) 0x46033d MOV (%RDX),%RCX |
(576) 0x460340 TEST %RCX,%RCX |
(576) 0x460343 JS 460660 |
(576) 0x460349 LEA (%R15,%RCX,8),%R11 |
(576) 0x46034d CMP %RDI,(%R11) |
(576) 0x460350 JE 460364 |
(576) 0x460352 MOV -0x68(%RBP),%R10 |
(576) 0x460356 MOV (%R10,%R14,1),%R9 |
(576) 0x46035a MOV %RCX,(%R9,%R8,8) |
(576) 0x46035e INC %R8 |
(576) 0x460361 MOV %RDI,(%R11) |
(576) 0x460364 ADD $0x8,%RDX |
(576) 0x460368 MOV (%RDX),%RCX |
(576) 0x46036b TEST %RCX,%RCX |
(576) 0x46036e JS 460620 |
(576) 0x460374 LEA (%R15,%RCX,8),%R10 |
(576) 0x460378 CMP %RDI,(%R10) |
(576) 0x46037b JE 46038f |
(576) 0x46037d MOV -0x68(%RBP),%R9 |
(576) 0x460381 MOV (%R9,%R14,1),%R11 |
(576) 0x460385 MOV %RCX,(%R11,%R8,8) |
(576) 0x460389 INC %R8 |
(576) 0x46038c MOV %RDI,(%R10) |
(576) 0x46038f ADD $0x8,%RDX |
(576) 0x460393 MOV (%RDX),%RCX |
(576) 0x460396 TEST %RCX,%RCX |
(576) 0x460399 JS 4605f0 |
(576) 0x46039f LEA (%R15,%RCX,8),%R11 |
(576) 0x4603a3 CMP %RDI,(%R11) |
(576) 0x4603a6 JE 4603ba |
(576) 0x4603a8 MOV -0x68(%RBP),%R9 |
(576) 0x4603ac MOV (%R9,%R14,1),%R10 |
(576) 0x4603b0 MOV %RCX,(%R10,%R8,8) |
(576) 0x4603b4 INC %R8 |
(576) 0x4603b7 MOV %RDI,(%R11) |
(576) 0x4603ba ADD $0x8,%RDX |
(576) 0x4603be CMP %RDX,-0x38(%RBP) |
(576) 0x4603c2 JE 460527 |
(576) 0x4603c8 MOV %RAX,-0x88(%RBP) |
(576) 0x4603cf MOV -0x68(%RBP),%R9 |
(576) 0x4603d3 MOV -0x90(%RBP),%R10 |
(576) 0x4603da JMP 46044d |
(577) 0x4603e0 LEA (%R15,%RDX,8),%R11 |
(577) 0x4603e4 CMP %RDI,(%R11) |
(577) 0x4603e7 JE 4603f7 |
(577) 0x4603e9 MOV (%R9,%R14,1),%RAX |
(577) 0x4603ed MOV %RDX,(%RAX,%R8,8) |
(577) 0x4603f1 INC %R8 |
(577) 0x4603f4 MOV %RDI,(%R11) |
(577) 0x4603f7 MOV 0x8(%RCX),%RDX |
(577) 0x4603fb TEST %RDX,%RDX |
(577) 0x4603fe JS 4604b2 |
(577) 0x460404 LEA (%R15,%RDX,8),%R11 |
(577) 0x460408 CMP %RDI,(%R11) |
(577) 0x46040b JE 46041b |
(577) 0x46040d MOV (%R9,%R14,1),%RAX |
(577) 0x460411 MOV %RDX,(%RAX,%R8,8) |
(577) 0x460415 INC %R8 |
(577) 0x460418 MOV %RDI,(%R11) |
(577) 0x46041b MOV 0x10(%RCX),%RDX |
(577) 0x46041f TEST %RDX,%RDX |
(577) 0x460422 JS 4604e3 |
(577) 0x460428 LEA (%R15,%RDX,8),%R11 |
(577) 0x46042c CMP %RDI,(%R11) |
(577) 0x46042f JE 46043f |
(577) 0x460431 MOV (%R9,%R14,1),%RAX |
(577) 0x460435 MOV %RDX,(%RAX,%R8,8) |
(577) 0x460439 INC %R8 |
(577) 0x46043c MOV %RDI,(%R11) |
(577) 0x46043f LEA 0x18(%RCX),%RDX |
(577) 0x460443 CMP %RDX,-0x38(%RBP) |
(577) 0x460447 JE 460515 |
(577) 0x46044d MOV (%RDX),%RCX |
(577) 0x460450 TEST %RCX,%RCX |
(577) 0x460453 JS 4605c0 |
(577) 0x460459 LEA (%R15,%RCX,8),%R11 |
(577) 0x46045d CMP %RDI,(%R11) |
(577) 0x460460 JE 460470 |
(577) 0x460462 MOV (%R9,%R14,1),%RAX |
(577) 0x460466 MOV %RCX,(%RAX,%R8,8) |
(577) 0x46046a INC %R8 |
(577) 0x46046d MOV %RDI,(%R11) |
(577) 0x460470 LEA 0x8(%RDX),%RCX |
(577) 0x460474 MOV 0x8(%RDX),%RDX |
(577) 0x460478 TEST %RDX,%RDX |
(577) 0x46047b JNS 4603e0 |
(577) 0x460481 MOV %RDX,%R11 |
(577) 0x460484 NOT %R11 |
(577) 0x460487 LEA (%R12,%R11,8),%R11 |
(577) 0x46048b CMP %RDI,(%R11) |
(577) 0x46048e JE 4603f7 |
(577) 0x460494 MOV (%R10,%R14,1),%RAX |
(577) 0x460498 NOT %RDX |
(577) 0x46049b MOV %RDX,(%RAX,%RSI,8) |
(577) 0x46049f INC %RSI |
(577) 0x4604a2 MOV %RDI,(%R11) |
(577) 0x4604a5 MOV 0x8(%RCX),%RDX |
(577) 0x4604a9 TEST %RDX,%RDX |
(577) 0x4604ac JNS 460404 |
(577) 0x4604b2 MOV %RDX,%R11 |
(577) 0x4604b5 NOT %R11 |
(577) 0x4604b8 LEA (%R12,%R11,8),%R11 |
(577) 0x4604bc CMP %RDI,(%R11) |
(577) 0x4604bf JE 46041b |
(577) 0x4604c5 MOV (%R10,%R14,1),%RAX |
(577) 0x4604c9 NOT %RDX |
(577) 0x4604cc MOV %RDX,(%RAX,%RSI,8) |
(577) 0x4604d0 INC %RSI |
(577) 0x4604d3 MOV %RDI,(%R11) |
(577) 0x4604d6 MOV 0x10(%RCX),%RDX |
(577) 0x4604da TEST %RDX,%RDX |
(577) 0x4604dd JNS 460428 |
(577) 0x4604e3 MOV %RDX,%R11 |
(577) 0x4604e6 NOT %R11 |
(577) 0x4604e9 LEA (%R12,%R11,8),%R11 |
(577) 0x4604ed CMP %RDI,(%R11) |
(577) 0x4604f0 JE 46043f |
(577) 0x4604f6 MOV (%R10,%R14,1),%RAX |
(577) 0x4604fa NOT %RDX |
(577) 0x4604fd MOV %RDX,(%RAX,%RSI,8) |
(577) 0x460501 INC %RSI |
(577) 0x460504 LEA 0x18(%RCX),%RDX |
(577) 0x460508 MOV %RDI,(%R11) |
(577) 0x46050b CMP %RDX,-0x38(%RBP) |
(577) 0x46050f JNE 46044d |
(576) 0x460515 MOV %R9,-0x68(%RBP) |
(576) 0x460519 MOV -0x88(%RBP),%RAX |
(576) 0x460520 MOV %R10,-0x90(%RBP) |
(576) 0x460527 MOV -0xc0(%RBP),%R9 |
(576) 0x46052e INC %RAX |
(576) 0x460531 MOV (%R9),%RCX |
(576) 0x460534 CMP %RCX,%RAX |
(576) 0x460537 JL 4602cc |
0x46053d NOPL (%RAX) |
0x460540 MOV %R8,-0x88(%RBP) |
0x460547 MOV -0x68(%RBP),%R9 |
0x46054b MOV -0x90(%RBP),%R10 |
0x460552 INCQ -0x70(%RBP) |
0x460556 MOV -0x70(%RBP),%RDI |
0x46055a CMP %RDI,-0xb8(%RBP) |
0x460561 JG 45ff20 |
(577) 0x4605c0 MOV %RCX,%R11 |
(577) 0x4605c3 NOT %R11 |
(577) 0x4605c6 LEA (%R12,%R11,8),%R11 |
(577) 0x4605ca CMP %RDI,(%R11) |
(577) 0x4605cd JE 460470 |
(577) 0x4605d3 MOV (%R10,%R14,1),%RAX |
(577) 0x4605d7 NOT %RCX |
(577) 0x4605da MOV %RCX,(%RAX,%RSI,8) |
(577) 0x4605de INC %RSI |
(577) 0x4605e1 MOV %RDI,(%R11) |
(577) 0x4605e4 JMP 460470 |
(576) 0x4605f0 MOV %RCX,%R11 |
(576) 0x4605f3 NOT %R11 |
(576) 0x4605f6 LEA (%R12,%R11,8),%R10 |
(576) 0x4605fa CMP %RDI,(%R10) |
(576) 0x4605fd JE 4603ba |
(576) 0x460603 MOV -0x90(%RBP),%R9 |
(576) 0x46060a NOT %RCX |
(576) 0x46060d MOV (%R9,%R14,1),%R11 |
(576) 0x460611 MOV %RCX,(%R11,%RSI,8) |
(576) 0x460615 INC %RSI |
(576) 0x460618 MOV %RDI,(%R10) |
(576) 0x46061b JMP 4603ba |
(576) 0x460620 MOV %RCX,%R10 |
(576) 0x460623 NOT %R10 |
(576) 0x460626 LEA (%R12,%R10,8),%R11 |
(576) 0x46062a CMP %RDI,(%R11) |
(576) 0x46062d JE 46038f |
(576) 0x460633 MOV -0x90(%RBP),%R9 |
(576) 0x46063a NOT %RCX |
(576) 0x46063d MOV (%R9,%R14,1),%R10 |
(576) 0x460641 MOV %RCX,(%R10,%RSI,8) |
(576) 0x460645 INC %RSI |
(576) 0x460648 MOV %RDI,(%R11) |
(576) 0x46064b JMP 46038f |
(578) 0x460650 MOV -0x90(%RBP),%R11 |
(578) 0x460657 MOV (%R11),%R8 |
(578) 0x46065a JMP 45ff80 |
(576) 0x460660 MOV %RCX,%R11 |
(576) 0x460663 NOT %R11 |
(576) 0x460666 LEA (%R12,%R11,8),%R10 |
(576) 0x46066a CMP %RDI,(%R10) |
(576) 0x46066d JE 460364 |
(576) 0x460673 MOV -0x90(%RBP),%R9 |
(576) 0x46067a NOT %RCX |
(576) 0x46067d MOV (%R9,%R14,1),%R11 |
(576) 0x460681 MOV %RCX,(%R11,%RSI,8) |
(576) 0x460685 INC %RSI |
(576) 0x460688 MOV %RDI,(%R10) |
(576) 0x46068b JMP 460364 |
/beegfs/hackathon/users/eoseret/qaas_runs/170-859-5251/intel/AMG/build/AMG/AMG/parcsr_ls/par_multi_interp.c: 1072 - 1125 |
-------------------------------------------------------------------------------- |
1072: for (i=thread_start; i < thread_stop; i++) |
1073: { |
1074: i1 = pass_array[i]; |
1075: for (j=S_diag_i[i1]; j < S_diag_i[i1+1]; j++) |
1076: { |
1077: j1 = S_diag_j[j]; |
1078: if (assigned[j1] == pass-1) |
1079: { |
1080: j_start = P_diag_start[j1]; |
1081: j_end = j_start+P_diag_i[j1+1]; |
1082: for (k=j_start; k < j_end; k++) |
1083: { |
1084: k1 = P_diag_pass[pass-1][k]; |
1085: if (P_marker[k1] != -i1-1) |
1086: { |
1087: P_diag_pass[pass][cnt_nz++] = k1; |
1088: P_marker[k1] = -i1-1; |
1089: } |
1090: } |
1091: j_start = P_offd_start[j1]; |
1092: j_end = j_start+P_offd_i[j1+1]; |
1093: for (k=j_start; k < j_end; k++) |
1094: { |
1095: k1 = P_offd_pass[pass-1][k]; |
1096: if (P_marker_offd[k1] != -i1-1) |
1097: { |
1098: P_offd_pass[pass][cnt_nz_offd++] = k1; |
1099: P_marker_offd[k1] = -i1-1; |
1100: } |
1101: } |
1102: } |
1103: } |
1104: for (j=S_offd_i[i1]; j < S_offd_i[i1+1]; j++) |
1105: { |
1106: j1 = S_offd_j[j]; |
1107: if (assigned_offd[j1] == pass-1) |
1108: { |
1109: j_start = Pext_start[j1]; |
1110: j_end = j_start+Pext_i[j1+1]; |
1111: for (k=j_start; k < j_end; k++) |
1112: { |
1113: k1 = Pext_pass[pass][k]; |
1114: if (k1 < 0) |
1115: { |
1116: if (P_marker[-k1-1] != -i1-1) |
1117: { |
1118: P_diag_pass[pass][cnt_nz++] = -k1-1; |
1119: P_marker[-k1-1] = -i1-1; |
1120: } |
1121: } |
1122: else if (P_marker_offd[k1] != -i1-1) |
1123: { |
1124: P_offd_pass[pass][cnt_nz_offd++] = k1; |
1125: P_marker_offd[k1] = -i1-1; |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.00 |
CQA speedup if FP arith vectorized | 1.00 |
CQA speedup if fully vectorized | 4.87 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.30 |
Bottlenecks | P5, P6, P7, |
Function | hypre_BoomerAMGBuildMultipass._omp_fn.5 |
Source | par_multi_interp.c:1072-1075,par_multi_interp.c:1104-1104,par_multi_interp.c:1122-1122 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 9.33 |
CQA cycles if no scalar integer | 9.33 |
CQA cycles if FP arith vectorized | 9.33 |
CQA cycles if fully vectorized | 1.92 |
Front-end cycles | 7.17 |
DIV/SQRT cycles | 2.75 |
P0 cycles | 2.75 |
P1 cycles | 2.50 |
P2 cycles | 2.50 |
P3 cycles | 2.50 |
P4 cycles | 9.33 |
P5 cycles | 9.33 |
P6 cycles | 9.33 |
P7 cycles | 0.00 |
P8 cycles | 0.00 |
P9 cycles | 0.00 |
P10 cycles | 0.00 |
P11 cycles | 0.00 |
P12 cycles | 0.00 |
P13 cycles | 0.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | NA |
Stall cycles (UFS) | NA |
Nb insns | 45.00 |
Nb uops | 43.00 |
Nb loads | 19.00 |
Nb stores | 10.00 |
Nb stack references | 12.00 |
FLOP/cycle | 0.00 |
Nb FLOP add-sub | 0.00 |
Nb FLOP mul | 0.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 24.86 |
Bytes prefetched | 0.00 |
Bytes loaded | 152.00 |
Bytes stored | 80.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 0.00 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | NA |
Vectorization ratio add_sub | NA |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 0.00 |
Vector-efficiency ratio all | 12.50 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | NA |
Vector-efficiency ratio add_sub | NA |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 12.50 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.00 |
CQA speedup if FP arith vectorized | 1.00 |
CQA speedup if fully vectorized | 4.87 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.30 |
Bottlenecks | P5, P6, P7, |
Function | hypre_BoomerAMGBuildMultipass._omp_fn.5 |
Source | par_multi_interp.c:1072-1075,par_multi_interp.c:1104-1104,par_multi_interp.c:1122-1122 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 9.33 |
CQA cycles if no scalar integer | 9.33 |
CQA cycles if FP arith vectorized | 9.33 |
CQA cycles if fully vectorized | 1.92 |
Front-end cycles | 7.17 |
DIV/SQRT cycles | 2.75 |
P0 cycles | 2.75 |
P1 cycles | 2.50 |
P2 cycles | 2.50 |
P3 cycles | 2.50 |
P4 cycles | 9.33 |
P5 cycles | 9.33 |
P6 cycles | 9.33 |
P7 cycles | 0.00 |
P8 cycles | 0.00 |
P9 cycles | 0.00 |
P10 cycles | 0.00 |
P11 cycles | 0.00 |
P12 cycles | 0.00 |
P13 cycles | 0.00 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | NA |
Stall cycles (UFS) | NA |
Nb insns | 45.00 |
Nb uops | 43.00 |
Nb loads | 19.00 |
Nb stores | 10.00 |
Nb stack references | 12.00 |
FLOP/cycle | 0.00 |
Nb FLOP add-sub | 0.00 |
Nb FLOP mul | 0.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 24.86 |
Bytes prefetched | 0.00 |
Bytes loaded | 152.00 |
Bytes stored | 80.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 0.00 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | NA |
Vectorization ratio add_sub | NA |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 0.00 |
Vector-efficiency ratio all | 12.50 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | NA |
Vector-efficiency ratio add_sub | NA |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 12.50 |
Path / |
Function | hypre_BoomerAMGBuildMultipass._omp_fn.5 |
Source file and lines | par_multi_interp.c:1072-1125 |
Module | exec |
nb instructions | 45 |
nb uops | 43 |
loop length | 228 |
used x86 registers | 10 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 12 |
micro-operation queue | 7.17 cycles |
front end | 7.17 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.75 | 2.75 | 2.50 | 2.50 | 2.50 | 9.33 | 9.33 | 9.33 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 2.75 | 2.75 | 2.50 | 2.50 | 2.50 | 9.33 | 9.33 | 9.33 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 7.17 |
Dispatch | 9.33 |
Overall L1 | 9.33 |
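Vectorization ratio all | 0% |
Vectorization ratio load | 0% |
Vectorization ratio store | 0% |
Vectorization ratio mul | NA (no mul vectorizable/vectorized instructions) |
Vectorization ratio add-sub | NA (no add-sub vectorizable/vectorized instructions) |
Vectorization ratio fma | NA (no fma vectorizable/vectorized instructions) |
Vectorization ratio div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
Vectorization ratio other | 0% |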
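Vector-efficiency ratio all | 12% |
Vector-efficiency ratio load | 12% |
Vector-efficiency ratio store | 12% |
Vector-efficiency ratio mul | NA (no mul vectorizable/vectorized instructions) |
Vector-efficiency ratio add-sub | NA (no add-sub vectorizable/vectorized instructions) |
Vector-efficiency ratio fma | NA (no fma vectorizable/vectorized instructions) |
Vector-efficiency ratio div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
Vector-efficiency ratio other | 12% |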
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0xb0(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R13,%RDI,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x8(,%RDI,8),%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%R8,%RDI,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDI,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R11,%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
NOT %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R8,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%R8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R8,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JGE 460280 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x1110> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RDI,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x88(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JMP 45ff91 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0xe21> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV %RDI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0xc0(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R13,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xe0(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0xc8(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RCX,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
NOT %RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RCX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 460552 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x13e2> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0x88(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R10,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0xd8(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JMP 4602cc <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x115c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x90(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
INCQ -0x70(%RBP) | 2 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RDI,-0xb8(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JG 45ff20 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0xdb0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
Function | hypre_BoomerAMGBuildMultipass._omp_fn.5 |
Source file and lines | par_multi_interp.c:1072-1125 |
Module | exec |
nb instructions | 45 |
nb uops | 43 |
loop length | 228 |
used x86 registers | 10 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 12 |
micro-operation queue | 7.17 cycles |
front end | 7.17 cycles |
ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.75 | 2.75 | 2.50 | 2.50 | 2.50 | 9.33 | 9.33 | 9.33 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
cycles | 2.75 | 2.75 | 2.50 | 2.50 | 2.50 | 9.33 | 9.33 | 9.33 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 | 0.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 7.17 |
Dispatch | 9.33 |
Overall L1 | 9.33 |
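Vectorization ratio all | 0% |
Vectorization ratio load | 0% |
Vectorization ratio store | 0% |
Vectorization ratio mul | NA (no mul vectorizable/vectorized instructions) |
Vectorization ratio add-sub | NA (no add-sub vectorizable/vectorized instructions) |
Vectorization ratio fma | NA (no fma vectorizable/vectorized instructions) |
Vectorization ratio div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
Vectorization ratio other | 0% |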
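Vector-efficiency ratio all | 12% |
Vector-efficiency ratio load | 12% |
Vector-efficiency ratio store | 12% |
Vector-efficiency ratio mul | NA (no mul vectorizable/vectorized instructions) |
Vector-efficiency ratio add-sub | NA (no add-sub vectorizable/vectorized instructions) |
Vector-efficiency ratio fma | NA (no fma vectorizable/vectorized instructions) |
Vector-efficiency ratio div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
Vector-efficiency ratio other | 12% |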
Instruction | Nb FU | ALU0/BRU0 | ALU1 | ALU2 | ALU3 | BRU1 | AGU0 | AGU1 | AGU2 | FP0 | FP1 | FP2 | FP3 | FP4 | FP5 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0xb0(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%R13,%RDI,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
LEA 0x8(,%RDI,8),%R11 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV (%R8,%RDI,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RDI,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R11,%R8 | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
NOT %RAX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %R8,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%R8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
CMP %R8,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JGE 460280 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x1110> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %RDI,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x88(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R11,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
JMP 45ff91 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0xe21> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPW (%RAX,%RAX,1) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV %RDI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0xc0(%RBP),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R13,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0xe0(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0xc8(%RBP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV (%RCX,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
ADD %R11,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
NOT %RDI | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOV %RCX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV (%RCX),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RAX,%RCX | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
JLE 460552 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x13e2> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0x88(%RBP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV %R10,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0xd8(%RBP),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
JMP 4602cc <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x115c> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
NOPL (%RAX) | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.09 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 4 | 0.50 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
MOV -0x90(%RBP),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
INCQ -0x70(%RBP) | 2 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.33 |
CMP %RDI,-0xb8(%RBP) | 1 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
JG 45ff20 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0xdb0> | 1 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50-1 |