Loop Id: 852 | Module: libparcsr_ls.so | Source: par_multi_interp.c:1072-1125 | Coverage: 0.14% |
---|
Loop Id: 852 | Module: libparcsr_ls.so | Source: par_multi_interp.c:1072-1125 | Coverage: 0.14% |
---|
0x810f0 MOV -0xb0(%RBP),%R13 |
0x810f7 MOV -0x70(%RBP),%RCX |
0x810fb MOV -0xd0(%RBP),%R8 |
0x81102 MOV (%R13,%RCX,8),%RDI |
0x81107 LEA 0x8(,%RDI,8),%RDX |
0x8110f MOV (%R8,%RDI,8),%R11 |
0x81113 MOV %RDI,%RAX |
0x81116 ADD %RDX,%R8 |
0x81119 NOT %RAX |
0x8111c MOV %R8,-0x90(%RBP) |
0x81123 MOV (%R8),%R8 |
0x81126 MOV %R11,-0x38(%RBP) |
0x8112a CMP %R8,%R11 |
0x8112d JGE 81450 |
0x81133 MOV %RDI,-0xe0(%RBP) |
0x8113a MOV %RBX,%R13 |
0x8113d MOV -0x88(%RBP),%RDI |
0x81144 MOV %RDX,-0xc0(%RBP) |
0x8114b JMP 81161 |
(855) 0x81150 INCQ -0x38(%RBP) |
(855) 0x81154 MOV -0x38(%RBP),%RDX |
(855) 0x81158 CMP %R8,%RDX |
(855) 0x8115b JGE 81438 |
(855) 0x81161 MOV -0x40(%RBP),%RDX |
(855) 0x81165 MOV -0x38(%RBP),%RBX |
(855) 0x81169 MOV (%RDX,%RBX,8),%RCX |
(855) 0x8116d MOV -0x48(%RBP),%RDX |
(855) 0x81171 LEA (,%RCX,8),%R11 |
(855) 0x81179 CMP %R13,(%RDX,%RCX,8) |
(855) 0x8117d JNE 81150 |
(855) 0x8117f MOV -0x80(%RBP),%R8 |
(855) 0x81183 MOV -0x60(%RBP),%RBX |
(855) 0x81187 MOV (%R8,%RCX,8),%R8 |
(855) 0x8118b MOV 0x8(%RBX,%R11,1),%RBX |
(855) 0x81190 ADD %R8,%RBX |
(855) 0x81193 CMP %RBX,%R8 |
(855) 0x81196 JGE 812f4 |
(855) 0x8119c MOV -0x8(%R10,%R14,1),%RDX |
(855) 0x811a1 LEA (%RDX,%RBX,8),%RBX |
(855) 0x811a5 LEA (%RDX,%R8,8),%R8 |
(855) 0x811a9 MOV %RBX,-0x68(%RBP) |
(855) 0x811ad SUB %R8,%RBX |
(855) 0x811b0 SUB $0x8,%RBX |
(855) 0x811b4 SHR $0x3,%RBX |
(855) 0x811b8 INC %RBX |
(855) 0x811bb AND $0x3,%EBX |
(855) 0x811be JE 81267 |
(855) 0x811c4 CMP $0x1,%RBX |
(855) 0x811c8 JE 8122e |
(855) 0x811ca CMP $0x2,%RBX |
(855) 0x811ce JE 811ff |
(855) 0x811d0 MOV (%R8),%RDX |
(855) 0x811d3 MOV %RDX,%RBX |
(855) 0x811d6 LEA (%R12,%RDX,8),%RDX |
(855) 0x811da MOV %RDX,-0x88(%RBP) |
(855) 0x811e1 CMP %RAX,(%RDX) |
(855) 0x811e4 JE 811fb |
(855) 0x811e6 MOV (%R10,%R14,1),%RDX |
(855) 0x811ea MOV %RBX,(%RDX,%RSI,8) |
(855) 0x811ee MOV -0x88(%RBP),%RBX |
(855) 0x811f5 INC %RSI |
(855) 0x811f8 MOV %RAX,(%RBX) |
(855) 0x811fb ADD $0x8,%R8 |
(855) 0x811ff MOV (%R8),%RDX |
(855) 0x81202 MOV %RDX,%RBX |
(855) 0x81205 LEA (%R12,%RDX,8),%RDX |
(855) 0x81209 MOV %RDX,-0x88(%RBP) |
(855) 0x81210 CMP %RAX,(%RDX) |
(855) 0x81213 JE 8122a |
(855) 0x81215 MOV (%R10,%R14,1),%RDX |
(855) 0x81219 MOV %RBX,(%RDX,%RSI,8) |
(855) 0x8121d MOV -0x88(%RBP),%RBX |
(855) 0x81224 INC %RSI |
(855) 0x81227 MOV %RAX,(%RBX) |
(855) 0x8122a ADD $0x8,%R8 |
(855) 0x8122e MOV (%R8),%RDX |
(855) 0x81231 MOV %RDX,%RBX |
(855) 0x81234 LEA (%R12,%RDX,8),%RDX |
(855) 0x81238 MOV %RDX,-0x88(%RBP) |
(855) 0x8123f CMP %RAX,(%RDX) |
(855) 0x81242 JE 81259 |
(855) 0x81244 MOV (%R10,%R14,1),%RDX |
(855) 0x81248 MOV %RBX,(%RDX,%RSI,8) |
(855) 0x8124c MOV -0x88(%RBP),%RBX |
(855) 0x81253 INC %RSI |
(855) 0x81256 MOV %RAX,(%RBX) |
(855) 0x81259 ADD $0x8,%R8 |
(855) 0x8125d CMP %R8,-0x68(%RBP) |
(855) 0x81261 JE 812f4 |
(855) 0x81267 MOV %RCX,-0x88(%RBP) |
(855) 0x8126e MOV %RDI,%RBX |
(857) 0x81271 MOV (%R8),%RDI |
(857) 0x81274 LEA (%R12,%RDI,8),%RDX |
(857) 0x81278 CMP %RAX,(%RDX) |
(857) 0x8127b JE 8128b |
(857) 0x8127d MOV (%R10,%R14,1),%RCX |
(857) 0x81281 MOV %RDI,(%RCX,%RSI,8) |
(857) 0x81285 INC %RSI |
(857) 0x81288 MOV %RAX,(%RDX) |
(857) 0x8128b LEA 0x8(%R8),%RDX |
(857) 0x8128f MOV 0x8(%R8),%R8 |
(857) 0x81293 LEA (%R12,%R8,8),%RDI |
(857) 0x81297 CMP %RAX,(%RDI) |
(857) 0x8129a JE 812aa |
(857) 0x8129c MOV (%R10,%R14,1),%RCX |
(857) 0x812a0 MOV %R8,(%RCX,%RSI,8) |
(857) 0x812a4 INC %RSI |
(857) 0x812a7 MOV %RAX,(%RDI) |
(857) 0x812aa MOV 0x8(%RDX),%R8 |
(857) 0x812ae LEA (%R12,%R8,8),%RDI |
(857) 0x812b2 CMP %RAX,(%RDI) |
(857) 0x812b5 JE 812c5 |
(857) 0x812b7 MOV (%R10,%R14,1),%RCX |
(857) 0x812bb MOV %R8,(%RCX,%RSI,8) |
(857) 0x812bf INC %RSI |
(857) 0x812c2 MOV %RAX,(%RDI) |
(857) 0x812c5 MOV 0x10(%RDX),%R8 |
(857) 0x812c9 LEA (%R12,%R8,8),%RDI |
(857) 0x812cd CMP %RAX,(%RDI) |
(857) 0x812d0 JE 812e0 |
(857) 0x812d2 MOV (%R10,%R14,1),%RCX |
(857) 0x812d6 MOV %R8,(%RCX,%RSI,8) |
(857) 0x812da INC %RSI |
(857) 0x812dd MOV %RAX,(%RDI) |
(857) 0x812e0 LEA 0x18(%RDX),%R8 |
(857) 0x812e4 CMP %R8,-0x68(%RBP) |
(857) 0x812e8 JNE 81271 |
(855) 0x812ea MOV -0x88(%RBP),%RCX |
(855) 0x812f1 MOV %RBX,%RDI |
(855) 0x812f4 MOV -0x78(%RBP),%RBX |
(855) 0x812f8 MOV -0x58(%RBP),%RDX |
(855) 0x812fc MOV (%RBX,%RCX,8),%RCX |
(855) 0x81300 MOV 0x8(%RDX,%R11,1),%R8 |
(855) 0x81305 ADD %RCX,%R8 |
(855) 0x81308 CMP %R8,%RCX |
(855) 0x8130b JGE 81830 |
(855) 0x81311 MOV -0x8(%R9,%R14,1),%RBX |
(855) 0x81316 LEA (%RBX,%RCX,8),%RCX |
(855) 0x8131a LEA (%RBX,%R8,8),%RBX |
(855) 0x8131e MOV %RBX,%RDX |
(855) 0x81321 SUB %RCX,%RDX |
(855) 0x81324 SUB $0x8,%RDX |
(855) 0x81328 SHR $0x3,%RDX |
(855) 0x8132c INC %RDX |
(855) 0x8132f AND $0x3,%EDX |
(855) 0x81332 JE 8139f |
(855) 0x81334 CMP $0x1,%RDX |
(855) 0x81338 JE 8137c |
(855) 0x8133a CMP $0x2,%RDX |
(855) 0x8133e JE 8135e |
(855) 0x81340 MOV (%RCX),%R11 |
(855) 0x81343 LEA (%R15,%R11,8),%R8 |
(855) 0x81347 CMP %RAX,(%R8) |
(855) 0x8134a JE 8135a |
(855) 0x8134c MOV (%R9,%R14,1),%RDX |
(855) 0x81350 MOV %R11,(%RDX,%RDI,8) |
(855) 0x81354 INC %RDI |
(855) 0x81357 MOV %RAX,(%R8) |
(855) 0x8135a ADD $0x8,%RCX |
(855) 0x8135e MOV (%RCX),%R11 |
(855) 0x81361 LEA (%R15,%R11,8),%R8 |
(855) 0x81365 CMP %RAX,(%R8) |
(855) 0x81368 JE 81378 |
(855) 0x8136a MOV (%R9,%R14,1),%RDX |
(855) 0x8136e MOV %R11,(%RDX,%RDI,8) |
(855) 0x81372 INC %RDI |
(855) 0x81375 MOV %RAX,(%R8) |
(855) 0x81378 ADD $0x8,%RCX |
(855) 0x8137c MOV (%RCX),%R11 |
(855) 0x8137f LEA (%R15,%R11,8),%R8 |
(855) 0x81383 CMP %RAX,(%R8) |
(855) 0x81386 JE 81396 |
(855) 0x81388 MOV (%R9,%R14,1),%RDX |
(855) 0x8138c MOV %R11,(%RDX,%RDI,8) |
(855) 0x81390 INC %RDI |
(855) 0x81393 MOV %RAX,(%R8) |
(855) 0x81396 ADD $0x8,%RCX |
(855) 0x8139a CMP %RBX,%RCX |
(855) 0x8139d JE 81417 |
(856) 0x8139f MOV (%RCX),%R8 |
(856) 0x813a2 LEA (%R15,%R8,8),%RDX |
(856) 0x813a6 CMP %RAX,(%RDX) |
(856) 0x813a9 JE 813b9 |
(856) 0x813ab MOV (%R9,%R14,1),%R11 |
(856) 0x813af MOV %R8,(%R11,%RDI,8) |
(856) 0x813b3 INC %RDI |
(856) 0x813b6 MOV %RAX,(%RDX) |
(856) 0x813b9 MOV 0x8(%RCX),%R8 |
(856) 0x813bd LEA 0x8(%RCX),%RDX |
(856) 0x813c1 LEA (%R15,%R8,8),%RCX |
(856) 0x813c5 CMP %RAX,(%RCX) |
(856) 0x813c8 JE 813d8 |
(856) 0x813ca MOV (%R9,%R14,1),%R11 |
(856) 0x813ce MOV %R8,(%R11,%RDI,8) |
(856) 0x813d2 INC %RDI |
(856) 0x813d5 MOV %RAX,(%RCX) |
(856) 0x813d8 MOV 0x8(%RDX),%R8 |
(856) 0x813dc LEA (%R15,%R8,8),%RCX |
(856) 0x813e0 CMP %RAX,(%RCX) |
(856) 0x813e3 JE 813f3 |
(856) 0x813e5 MOV (%R9,%R14,1),%R11 |
(856) 0x813e9 MOV %R8,(%R11,%RDI,8) |
(856) 0x813ed INC %RDI |
(856) 0x813f0 MOV %RAX,(%RCX) |
(856) 0x813f3 MOV 0x10(%RDX),%R8 |
(856) 0x813f7 LEA (%R15,%R8,8),%RCX |
(856) 0x813fb CMP %RAX,(%RCX) |
(856) 0x813fe JE 8140e |
(856) 0x81400 MOV (%R9,%R14,1),%R11 |
(856) 0x81404 MOV %R8,(%R11,%RDI,8) |
(856) 0x81408 INC %RDI |
(856) 0x8140b MOV %RAX,(%RCX) |
(856) 0x8140e LEA 0x18(%RDX),%RCX |
(856) 0x81412 CMP %RBX,%RCX |
(856) 0x81415 JNE 8139f |
(855) 0x81417 INCQ -0x38(%RBP) |
(855) 0x8141b MOV -0x90(%RBP),%RBX |
(855) 0x81422 MOV (%RBX),%R8 |
(855) 0x81425 MOV -0x38(%RBP),%RDX |
(855) 0x81429 CMP %R8,%RDX |
(855) 0x8142c JL 81161 |
0x81432 NOPW (%RAX,%RAX,1) |
0x81438 MOV %RDI,-0x88(%RBP) |
0x8143f MOV -0xc0(%RBP),%RDX |
0x81446 MOV %R13,%RBX |
0x81449 MOV -0xe0(%RBP),%RDI |
0x81450 MOV -0xc8(%RBP),%R11 |
0x81457 MOV (%R11,%RDI,8),%RAX |
0x8145b ADD %RDX,%R11 |
0x8145e NOT %RDI |
0x81461 MOV (%R11),%RCX |
0x81464 MOV %R11,-0xc0(%RBP) |
0x8146b CMP %RAX,%RCX |
0x8146e JLE 8172a |
0x81474 MOV -0x88(%RBP),%R8 |
0x8147b MOV -0xd8(%RBP),%R13 |
0x81482 MOV %R9,-0x68(%RBP) |
0x81486 MOV %R10,-0x90(%RBP) |
0x8148d JMP 8149c |
(853) 0x81490 INC %RAX |
(853) 0x81493 CMP %RCX,%RAX |
(853) 0x81496 JGE 81718 |
(853) 0x8149c MOV -0x50(%RBP),%R9 |
(853) 0x814a0 MOV (%R9,%RAX,8),%RDX |
(853) 0x814a4 LEA (,%RDX,8),%R11 |
(853) 0x814ac CMP %RBX,(%R13,%RDX,8) |
(853) 0x814b1 JNE 81490 |
(853) 0x814b3 MOV -0xa0(%RBP),%R10 |
(853) 0x814ba MOV -0x98(%RBP),%R9 |
(853) 0x814c1 MOV (%R10,%RDX,8),%RDX |
(853) 0x814c5 MOV 0x8(%R9,%R11,1),%R11 |
(853) 0x814ca ADD %RDX,%R11 |
(853) 0x814cd CMP %R11,%RDX |
(853) 0x814d0 JGE 81490 |
(853) 0x814d2 MOV -0xa8(%RBP),%RCX |
(853) 0x814d9 MOV (%RCX,%R14,1),%R10 |
(853) 0x814dd LEA (%R10,%R11,8),%R9 |
(853) 0x814e1 LEA (%R10,%RDX,8),%RDX |
(853) 0x814e5 MOV %R9,-0x38(%RBP) |
(853) 0x814e9 SUB %RDX,%R9 |
(853) 0x814ec SUB $0x8,%R9 |
(853) 0x814f0 SHR $0x3,%R9 |
(853) 0x814f4 INC %R9 |
(853) 0x814f7 AND $0x3,%R9D |
(853) 0x814fb JE 8159b |
(853) 0x81501 CMP $0x1,%R9 |
(853) 0x81505 JE 81563 |
(853) 0x81507 CMP $0x2,%R9 |
(853) 0x8150b JE 81538 |
(853) 0x8150d MOV (%RDX),%RCX |
(853) 0x81510 TEST %RCX,%RCX |
(853) 0x81513 JS 81840 |
(853) 0x81519 LEA (%R15,%RCX,8),%R11 |
(853) 0x8151d CMP %RDI,(%R11) |
(853) 0x81520 JE 81534 |
(853) 0x81522 MOV -0x68(%RBP),%R10 |
(853) 0x81526 MOV (%R10,%R14,1),%R9 |
(853) 0x8152a MOV %RCX,(%R9,%R8,8) |
(853) 0x8152e INC %R8 |
(853) 0x81531 MOV %RDI,(%R11) |
(853) 0x81534 ADD $0x8,%RDX |
(853) 0x81538 MOV (%RDX),%RCX |
(853) 0x8153b TEST %RCX,%RCX |
(853) 0x8153e JS 81800 |
(853) 0x81544 LEA (%R15,%RCX,8),%R10 |
(853) 0x81548 CMP %RDI,(%R10) |
(853) 0x8154b JE 8155f |
(853) 0x8154d MOV -0x68(%RBP),%R9 |
(853) 0x81551 MOV (%R9,%R14,1),%R11 |
(853) 0x81555 MOV %RCX,(%R11,%R8,8) |
(853) 0x81559 INC %R8 |
(853) 0x8155c MOV %RDI,(%R10) |
(853) 0x8155f ADD $0x8,%RDX |
(853) 0x81563 MOV (%RDX),%RCX |
(853) 0x81566 TEST %RCX,%RCX |
(853) 0x81569 JS 817c8 |
(853) 0x8156f LEA (%R15,%RCX,8),%R11 |
(853) 0x81573 CMP %RDI,(%R11) |
(853) 0x81576 JE 8158a |
(853) 0x81578 MOV -0x68(%RBP),%R9 |
(853) 0x8157c MOV (%R9,%R14,1),%R10 |
(853) 0x81580 MOV %RCX,(%R10,%R8,8) |
(853) 0x81584 INC %R8 |
(853) 0x81587 MOV %RDI,(%R11) |
(853) 0x8158a MOV -0x38(%RBP),%RCX |
(853) 0x8158e ADD $0x8,%RDX |
(853) 0x81592 CMP %RCX,%RDX |
(853) 0x81595 JE 816fd |
(853) 0x8159b MOV -0x68(%RBP),%R9 |
(853) 0x8159f MOV -0x90(%RBP),%R10 |
(853) 0x815a6 MOV %RAX,-0x88(%RBP) |
(853) 0x815ad JMP 81620 |
(854) 0x815b0 LEA (%R15,%RDX,8),%R11 |
(854) 0x815b4 CMP %RDI,(%R11) |
(854) 0x815b7 JE 815c7 |
(854) 0x815b9 MOV (%R9,%R14,1),%RAX |
(854) 0x815bd MOV %RDX,(%RAX,%R8,8) |
(854) 0x815c1 INC %R8 |
(854) 0x815c4 MOV %RDI,(%R11) |
(854) 0x815c7 MOV 0x8(%RCX),%RDX |
(854) 0x815cb TEST %RDX,%RDX |
(854) 0x815ce JS 81685 |
(854) 0x815d4 LEA (%R15,%RDX,8),%R11 |
(854) 0x815d8 CMP %RDI,(%R11) |
(854) 0x815db JE 815eb |
(854) 0x815dd MOV (%R9,%R14,1),%RAX |
(854) 0x815e1 MOV %RDX,(%RAX,%R8,8) |
(854) 0x815e5 INC %R8 |
(854) 0x815e8 MOV %RDI,(%R11) |
(854) 0x815eb MOV 0x10(%RCX),%RDX |
(854) 0x815ef TEST %RDX,%RDX |
(854) 0x815f2 JS 816b6 |
(854) 0x815f8 LEA (%R15,%RDX,8),%R11 |
(854) 0x815fc CMP %RDI,(%R11) |
(854) 0x815ff JE 8160f |
(854) 0x81601 MOV (%R9,%R14,1),%RAX |
(854) 0x81605 MOV %RDX,(%RAX,%R8,8) |
(854) 0x81609 INC %R8 |
(854) 0x8160c MOV %RDI,(%R11) |
(854) 0x8160f LEA 0x18(%RCX),%RDX |
(854) 0x81613 MOV -0x38(%RBP),%RCX |
(854) 0x81617 CMP %RCX,%RDX |
(854) 0x8161a JE 816eb |
(854) 0x81620 MOV (%RDX),%RCX |
(854) 0x81623 TEST %RCX,%RCX |
(854) 0x81626 JS 81798 |
(854) 0x8162c LEA (%R15,%RCX,8),%R11 |
(854) 0x81630 CMP %RDI,(%R11) |
(854) 0x81633 JE 81643 |
(854) 0x81635 MOV (%R9,%R14,1),%RAX |
(854) 0x81639 MOV %RCX,(%RAX,%R8,8) |
(854) 0x8163d INC %R8 |
(854) 0x81640 MOV %RDI,(%R11) |
(854) 0x81643 LEA 0x8(%RDX),%RCX |
(854) 0x81647 MOV 0x8(%RDX),%RDX |
(854) 0x8164b TEST %RDX,%RDX |
(854) 0x8164e JNS 815b0 |
(854) 0x81654 MOV %RDX,%R11 |
(854) 0x81657 NOT %R11 |
(854) 0x8165a LEA (%R12,%R11,8),%R11 |
(854) 0x8165e CMP %RDI,(%R11) |
(854) 0x81661 JE 815c7 |
(854) 0x81667 MOV (%R10,%R14,1),%RAX |
(854) 0x8166b NOT %RDX |
(854) 0x8166e MOV %RDX,(%RAX,%RSI,8) |
(854) 0x81672 INC %RSI |
(854) 0x81675 MOV %RDI,(%R11) |
(854) 0x81678 MOV 0x8(%RCX),%RDX |
(854) 0x8167c TEST %RDX,%RDX |
(854) 0x8167f JNS 815d4 |
(854) 0x81685 MOV %RDX,%R11 |
(854) 0x81688 NOT %R11 |
(854) 0x8168b LEA (%R12,%R11,8),%R11 |
(854) 0x8168f CMP %RDI,(%R11) |
(854) 0x81692 JE 815eb |
(854) 0x81698 MOV (%R10,%R14,1),%RAX |
(854) 0x8169c NOT %RDX |
(854) 0x8169f MOV %RDX,(%RAX,%RSI,8) |
(854) 0x816a3 INC %RSI |
(854) 0x816a6 MOV %RDI,(%R11) |
(854) 0x816a9 MOV 0x10(%RCX),%RDX |
(854) 0x816ad TEST %RDX,%RDX |
(854) 0x816b0 JNS 815f8 |
(854) 0x816b6 MOV %RDX,%R11 |
(854) 0x816b9 NOT %R11 |
(854) 0x816bc LEA (%R12,%R11,8),%R11 |
(854) 0x816c0 CMP %RDI,(%R11) |
(854) 0x816c3 JE 8160f |
(854) 0x816c9 MOV (%R10,%R14,1),%RAX |
(854) 0x816cd NOT %RDX |
(854) 0x816d0 MOV %RDX,(%RAX,%RSI,8) |
(854) 0x816d4 LEA 0x18(%RCX),%RDX |
(854) 0x816d8 MOV -0x38(%RBP),%RCX |
(854) 0x816dc INC %RSI |
(854) 0x816df MOV %RDI,(%R11) |
(854) 0x816e2 CMP %RCX,%RDX |
(854) 0x816e5 JNE 81620 |
(853) 0x816eb MOV %R9,-0x68(%RBP) |
(853) 0x816ef MOV -0x88(%RBP),%RAX |
(853) 0x816f6 MOV %R10,-0x90(%RBP) |
(853) 0x816fd MOV -0xc0(%RBP),%R9 |
(853) 0x81704 INC %RAX |
(853) 0x81707 MOV (%R9),%RCX |
(853) 0x8170a CMP %RCX,%RAX |
(853) 0x8170d JL 8149c |
0x81713 NOPL (%RAX,%RAX,1) |
0x81718 MOV -0x68(%RBP),%R9 |
0x8171c MOV -0x90(%RBP),%R10 |
0x81723 MOV %R8,-0x88(%RBP) |
0x8172a INCQ -0x70(%RBP) |
0x8172e MOV -0x70(%RBP),%RDI |
0x81732 CMP %RDI,-0xb8(%RBP) |
0x81739 JG 810f0 |
(854) 0x81798 MOV %RCX,%R11 |
(854) 0x8179b NOT %R11 |
(854) 0x8179e LEA (%R12,%R11,8),%R11 |
(854) 0x817a2 CMP %RDI,(%R11) |
(854) 0x817a5 JE 81643 |
(854) 0x817ab MOV (%R10,%R14,1),%RAX |
(854) 0x817af NOT %RCX |
(854) 0x817b2 MOV %RCX,(%RAX,%RSI,8) |
(854) 0x817b6 INC %RSI |
(854) 0x817b9 MOV %RDI,(%R11) |
(854) 0x817bc JMP 81643 |
(853) 0x817c8 MOV %RCX,%R11 |
(853) 0x817cb NOT %R11 |
(853) 0x817ce LEA (%R12,%R11,8),%R10 |
(853) 0x817d2 CMP %RDI,(%R10) |
(853) 0x817d5 JE 8158a |
(853) 0x817db MOV -0x90(%RBP),%R9 |
(853) 0x817e2 NOT %RCX |
(853) 0x817e5 MOV (%R9,%R14,1),%R11 |
(853) 0x817e9 MOV %RCX,(%R11,%RSI,8) |
(853) 0x817ed INC %RSI |
(853) 0x817f0 MOV %RDI,(%R10) |
(853) 0x817f3 JMP 8158a |
(853) 0x81800 MOV %RCX,%R10 |
(853) 0x81803 NOT %R10 |
(853) 0x81806 LEA (%R12,%R10,8),%R11 |
(853) 0x8180a CMP %RDI,(%R11) |
(853) 0x8180d JE 8155f |
(853) 0x81813 MOV -0x90(%RBP),%R9 |
(853) 0x8181a NOT %RCX |
(853) 0x8181d MOV (%R9,%R14,1),%R10 |
(853) 0x81821 MOV %RCX,(%R10,%RSI,8) |
(853) 0x81825 INC %RSI |
(853) 0x81828 MOV %RDI,(%R11) |
(853) 0x8182b JMP 8155f |
(855) 0x81830 MOV -0x90(%RBP),%R11 |
(855) 0x81837 MOV (%R11),%R8 |
(855) 0x8183a JMP 81150 |
(853) 0x81840 MOV %RCX,%R11 |
(853) 0x81843 NOT %R11 |
(853) 0x81846 LEA (%R12,%R11,8),%R10 |
(853) 0x8184a CMP %RDI,(%R10) |
(853) 0x8184d JE 81534 |
(853) 0x81853 MOV -0x90(%RBP),%R9 |
(853) 0x8185a NOT %RCX |
(853) 0x8185d MOV (%R9,%R14,1),%R11 |
(853) 0x81861 MOV %RCX,(%R11,%RSI,8) |
(853) 0x81865 INC %RSI |
(853) 0x81868 MOV %RDI,(%R10) |
(853) 0x8186b JMP 81534 |
/home/eoseret/qaas_runs_CPU_9468/171-716-5699/intel/AMG/build/AMG/AMG/parcsr_ls/par_multi_interp.c: 1072 - 1125 |
-------------------------------------------------------------------------------- |
1072: for (i=thread_start; i < thread_stop; i++) |
1073: { |
1074: i1 = pass_array[i]; |
1075: for (j=S_diag_i[i1]; j < S_diag_i[i1+1]; j++) |
1076: { |
1077: j1 = S_diag_j[j]; |
1078: if (assigned[j1] == pass-1) |
1079: { |
1080: j_start = P_diag_start[j1]; |
1081: j_end = j_start+P_diag_i[j1+1]; |
1082: for (k=j_start; k < j_end; k++) |
1083: { |
1084: k1 = P_diag_pass[pass-1][k]; |
1085: if (P_marker[k1] != -i1-1) |
1086: { |
1087: P_diag_pass[pass][cnt_nz++] = k1; |
1088: P_marker[k1] = -i1-1; |
1089: } |
1090: } |
1091: j_start = P_offd_start[j1]; |
1092: j_end = j_start+P_offd_i[j1+1]; |
1093: for (k=j_start; k < j_end; k++) |
1094: { |
1095: k1 = P_offd_pass[pass-1][k]; |
1096: if (P_marker_offd[k1] != -i1-1) |
1097: { |
1098: P_offd_pass[pass][cnt_nz_offd++] = k1; |
1099: P_marker_offd[k1] = -i1-1; |
1100: } |
1101: } |
1102: } |
1103: } |
1104: for (j=S_offd_i[i1]; j < S_offd_i[i1+1]; j++) |
1105: { |
1106: j1 = S_offd_j[j]; |
1107: if (assigned_offd[j1] == pass-1) |
1108: { |
1109: j_start = Pext_start[j1]; |
1110: j_end = j_start+Pext_i[j1+1]; |
1111: for (k=j_start; k < j_end; k++) |
1112: { |
1113: k1 = Pext_pass[pass][k]; |
1114: if (k1 < 0) |
1115: { |
1116: if (P_marker[-k1-1] != -i1-1) |
1117: { |
1118: P_diag_pass[pass][cnt_nz++] = -k1-1; |
1119: P_marker[-k1-1] = -i1-1; |
1120: } |
1121: } |
1122: else if (P_marker_offd[k1] != -i1-1) |
1123: { |
1124: P_offd_pass[pass][cnt_nz_offd++] = k1; |
1125: P_marker_offd[k1] = -i1-1; |
Path / |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.00 |
CQA speedup if FP arith vectorized | 1.00 |
CQA speedup if fully vectorized | 8.00 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.21 |
Bottlenecks | micro-operation queue, |
Function | hypre_BoomerAMGBuildMultipass._omp_fn.5 |
Source | par_multi_interp.c:1072-1075,par_multi_interp.c:1104-1104,par_multi_interp.c:1122-1122 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 7.67 |
CQA cycles if no scalar integer | 7.67 |
CQA cycles if FP arith vectorized | 7.67 |
CQA cycles if fully vectorized | 0.96 |
Front-end cycles | 7.67 |
DIV/SQRT cycles | 0.00 |
P0 cycles | 2.10 |
P1 cycles | 2.00 |
P2 cycles | 6.33 |
P3 cycles | 6.33 |
P4 cycles | 5.00 |
P5 cycles | 2.00 |
P6 cycles | 1.90 |
P7 cycles | 5.00 |
P8 cycles | 5.00 |
P9 cycles | 5.00 |
P10 cycles | 2.00 |
P11 cycles | 6.33 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 7.86 |
Stall cycles (UFS) | 0.00 |
Nb insns | 45.00 |
Nb uops | 46.00 |
Nb loads | 19.00 |
Nb stores | 10.00 |
Nb stack references | 12.00 |
FLOP/cycle | 0.00 |
Nb FLOP add-sub | 0.00 |
Nb FLOP mul | 0.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 30.26 |
Bytes prefetched | 0.00 |
Bytes loaded | 152.00 |
Bytes stored | 80.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 0.00 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | NA |
Vectorization ratio add_sub | NA |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 0.00 |
Vector-efficiency ratio all | 12.50 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | NA |
Vector-efficiency ratio add_sub | NA |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 12.50 |
Metric | Value |
---|---|
CQA speedup if no scalar integer | 1.00 |
CQA speedup if FP arith vectorized | 1.00 |
CQA speedup if fully vectorized | 8.00 |
CQA speedup if no inter-iteration dependency | NA |
CQA speedup if next bottleneck killed | 1.21 |
Bottlenecks | micro-operation queue, |
Function | hypre_BoomerAMGBuildMultipass._omp_fn.5 |
Source | par_multi_interp.c:1072-1075,par_multi_interp.c:1104-1104,par_multi_interp.c:1122-1122 |
Source loop unroll info | NA |
Source loop unroll confidence level | NA |
Unroll/vectorization loop type | NA |
Unroll factor | NA |
CQA cycles | 7.67 |
CQA cycles if no scalar integer | 7.67 |
CQA cycles if FP arith vectorized | 7.67 |
CQA cycles if fully vectorized | 0.96 |
Front-end cycles | 7.67 |
DIV/SQRT cycles | 0.00 |
P0 cycles | 2.10 |
P1 cycles | 2.00 |
P2 cycles | 6.33 |
P3 cycles | 6.33 |
P4 cycles | 5.00 |
P5 cycles | 2.00 |
P6 cycles | 1.90 |
P7 cycles | 5.00 |
P8 cycles | 5.00 |
P9 cycles | 5.00 |
P10 cycles | 2.00 |
P11 cycles | 6.33 |
Inter-iter dependencies cycles | NA |
FE+BE cycles (UFS) | 7.86 |
Stall cycles (UFS) | 0.00 |
Nb insns | 45.00 |
Nb uops | 46.00 |
Nb loads | 19.00 |
Nb stores | 10.00 |
Nb stack references | 12.00 |
FLOP/cycle | 0.00 |
Nb FLOP add-sub | 0.00 |
Nb FLOP mul | 0.00 |
Nb FLOP fma | 0.00 |
Nb FLOP div | 0.00 |
Nb FLOP rcp | 0.00 |
Nb FLOP sqrt | 0.00 |
Nb FLOP rsqrt | 0.00 |
Bytes/cycle | 30.26 |
Bytes prefetched | 0.00 |
Bytes loaded | 152.00 |
Bytes stored | 80.00 |
Stride 0 | NA |
Stride 1 | NA |
Stride n | NA |
Stride unknown | NA |
Stride indirect | NA |
Vectorization ratio all | 0.00 |
Vectorization ratio load | 0.00 |
Vectorization ratio store | 0.00 |
Vectorization ratio mul | NA |
Vectorization ratio add_sub | NA |
Vectorization ratio fma | NA |
Vectorization ratio div_sqrt | NA |
Vectorization ratio other | 0.00 |
Vector-efficiency ratio all | 12.50 |
Vector-efficiency ratio load | 12.50 |
Vector-efficiency ratio store | 12.50 |
Vector-efficiency ratio mul | NA |
Vector-efficiency ratio add_sub | NA |
Vector-efficiency ratio fma | NA |
Vector-efficiency ratio div_sqrt | NA |
Vector-efficiency ratio other | 12.50 |
Path / |
Function | hypre_BoomerAMGBuildMultipass._omp_fn.5 |
Source file and lines | par_multi_interp.c:1072-1125 |
Module | libparcsr_ls.so |
nb instructions | 45 |
nb uops | 46 |
loop length | 230 |
used x86 registers | 11 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 12 |
micro-operation queue | 7.67 cycles |
front end | 7.67 cycles |
| | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.10 | 2.00 | 6.33 | 6.33 | 5.00 | 2.00 | 1.90 | 5.00 | 5.00 | 5.00 | 2.00 | 6.33 |
cycles | 2.10 | 2.00 | 6.33 | 6.33 | 5.00 | 2.00 | 1.90 | 5.00 | 5.00 | 5.00 | 2.00 | 6.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 7.86 |
Stall cycles | 0.00 |
Front-end | 7.67 |
Dispatch | 6.33 |
Overall L1 | 7.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0xb0(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%RCX,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(,%RDI,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R8,%RDI,8),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R8),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R8,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 81450 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x1120> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDI,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x88(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 81161 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0xe31> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xc0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0xe0(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R11,%RDI,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOT %RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R11),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 8172a <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x13fa> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x88(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd8(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 8149c <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x116c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INCQ -0x70(%RBP) | 3 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,-0xb8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JG 810f0 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0xdc0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
Function | hypre_BoomerAMGBuildMultipass._omp_fn.5 |
Source file and lines | par_multi_interp.c:1072-1125 |
Module | libparcsr_ls.so |
nb instructions | 45 |
nb uops | 46 |
loop length | 230 |
used x86 registers | 11 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 12 |
micro-operation queue | 7.67 cycles |
front end | 7.67 cycles |
| | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.10 | 2.00 | 6.33 | 6.33 | 5.00 | 2.00 | 1.90 | 5.00 | 5.00 | 5.00 | 2.00 | 6.33 |
cycles | 2.10 | 2.00 | 6.33 | 6.33 | 5.00 | 2.00 | 1.90 | 5.00 | 5.00 | 5.00 | 2.00 | 6.33 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 7.86 |
Stall cycles | 0.00 |
Front-end | 7.67 |
Dispatch | 6.33 |
Overall L1 | 7.67 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 12% |
load | 12% |
store | 12% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
MOV -0xb0(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x70(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd0(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R13,%RCX,8),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(,%RDI,8),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R8,%RDI,8),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
ADD %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R8),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %R8,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 81450 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x1120> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RDI,-0xe0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RBX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x88(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 81161 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0xe31> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0xc0(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0xe0(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xc8(%RBP),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%R11,%RDI,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOT %RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV (%R11),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,-0xc0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JLE 8172a <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x13fa> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x88(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0xd8(%RBP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 8149c <hypre_BoomerAMGBuildMultipass._omp_fn.5+0x116c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x68(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x90(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INCQ -0x70(%RBP) | 3 | 0.20 | 0.20 | 0.33 | 0.33 | 0.50 | 0.20 | 0.20 | 0.50 | 0.50 | 0.50 | 0.20 | 0.33 | 1 | 0.50 |
MOV -0x70(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,-0xb8(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
JG 810f0 <hypre_BoomerAMGBuildMultipass._omp_fn.5+0xdc0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |