Function: hypre_IJMatrixSetValuesOMPParCSR.extracted.28 | Module: exec | Source: IJMatrix_parcsr.c:3240-3484 [...] | Coverage: 0.56% |
---|
Function: hypre_IJMatrixSetValuesOMPParCSR.extracted.28 | Module: exec | Source: IJMatrix_parcsr.c:3240-3484 [...] | Coverage: 0.56% |
---|
/scratch_na/users/xoserete/qaas_runs/171-172-8218/intel/AMG/build/AMG/AMG/IJ_mv/IJMatrix_parcsr.c: 3240 - 3484 |
-------------------------------------------------------------------------------- |
3240: #pragma omp parallel |
[...] |
3256: num_threads = hypre_NumActiveThreads(); |
3257: my_thread_num = hypre_GetThreadNum(); |
3258: |
3259: len = nrows/num_threads; |
3260: rest = nrows - len*num_threads; |
3261: |
3262: if (my_thread_num < rest) |
3263: { |
3264: ns = my_thread_num*(len+1); |
3265: ne = (my_thread_num+1)*(len+1); |
3266: } |
3267: else |
3268: { |
3269: ns = my_thread_num*len+rest; |
3270: ne = (my_thread_num+1)*len+rest; |
3271: } |
3272: |
3273: value_start[my_thread_num] = 0; |
3274: for (ii=ns; ii < ne; ii++) |
3275: value_start[my_thread_num] += ncols[ii]; |
3276: |
3277: #ifdef HYPRE_USING_OPENMP |
3278: #pragma omp barrier |
3279: #endif |
3280: if (my_thread_num == 0) |
3281: { |
3282: for (i=0; i < max_num_threads; i++) |
3283: value_start[i+1] += value_start[i]; |
[...] |
3289: if (my_thread_num) |
3290: indx = value_start[my_thread_num-1]; |
3291: for (ii=ns; ii < ne; ii++) |
3292: { |
3293: row = rows[ii]; |
3294: n = ncols[ii]; |
3295: /* processor owns the row */ |
3296: if (row >= row_partitioning[pstart] && row < row_partitioning[pstart+1]) |
3297: { |
3298: row_local = row - row_partitioning[pstart]; |
3299: /* compute local row number */ |
3300: if (need_aux) |
3301: { |
3302: local_j = aux_j[row_local]; |
3303: local_data = aux_data[row_local]; |
3304: space = row_space[row_local]; |
3305: old_size = row_length[row_local]; |
3306: size = space - old_size; |
3307: if (size < n) |
3308: { |
3309: size = n - size; |
3310: tmp_j = hypre_CTAlloc(HYPRE_Int,size); |
3311: tmp_data = hypre_CTAlloc(HYPRE_Complex,size); |
3312: } |
3313: tmp_indx = 0; |
3314: not_found = 1; |
3315: size = old_size; |
3316: for (i=0; i < n; i++) |
3317: { |
3318: for (j=0; j < old_size; j++) |
3319: { |
3320: if (local_j[j] == cols[indx]) |
3321: { |
3322: local_data[j] = values[indx]; |
[...] |
3329: if (size < space) |
3330: { |
3331: local_j[size] = cols[indx]; |
3332: local_data[size++] = values[indx]; |
3333: } |
3334: else |
3335: { |
3336: tmp_j[tmp_indx] = cols[indx]; |
3337: tmp_data[tmp_indx++] = values[indx]; |
3338: } |
3339: } |
3340: not_found = 1; |
3341: indx++; |
3342: } |
3343: |
3344: row_length[row_local] = size+tmp_indx; |
3345: |
3346: if (tmp_indx) |
3347: { |
3348: aux_j[row_local] = hypre_TReAlloc(aux_j[row_local],HYPRE_Int, |
3349: size+tmp_indx); |
3350: aux_data[row_local] = hypre_TReAlloc(aux_data[row_local], |
3351: HYPRE_Complex,size+tmp_indx); |
3352: row_space[row_local] = size+tmp_indx; |
3353: local_j = aux_j[row_local]; |
[...] |
3359: for (i=0; i < tmp_indx; i++) |
3360: { |
3361: local_j[cnt] = tmp_j[i]; |
3362: local_data[cnt++] = tmp_data[i]; |
3363: } |
3364: |
3365: if (tmp_j) |
3366: { |
3367: hypre_TFree(tmp_j); |
3368: hypre_TFree(tmp_data); |
[...] |
3376: offd_indx = hypre_AuxParCSRMatrixIndxOffd(aux_matrix)[row_local]; |
3377: diag_indx = hypre_AuxParCSRMatrixIndxDiag(aux_matrix)[row_local]; |
3378: cnt_diag = diag_indx; |
3379: cnt_offd = offd_indx; |
3380: diag_space = diag_i[row_local+1]; |
3381: offd_space = offd_i[row_local+1]; |
3382: not_found = 1; |
3383: for (i=0; i < n; i++) |
3384: { |
3385: if (cols[indx] < col_0 || cols[indx] > col_n) |
3386: /* insert into offd */ |
3387: { |
3388: for (j=offd_i[row_local]; j < offd_indx; j++) |
3389: { |
3390: if (offd_j[j] == cols[indx]) |
3391: { |
3392: offd_data[j] = values[indx]; |
[...] |
3399: if (cnt_offd < offd_space) |
3400: { |
3401: offd_j[cnt_offd] = cols[indx]; |
3402: offd_data[cnt_offd++] = values[indx]; |
3403: } |
3404: else |
3405: { |
3406: hypre_error(HYPRE_ERROR_GENERIC); |
3407: #ifdef HYPRE_USING_OPENMP |
3408: #pragma omp atomic |
3409: #endif |
3410: error_flag++; |
[...] |
3422: for (j=diag_i[row_local]; j < diag_indx; j++) |
3423: { |
3424: if (diag_j[j] == cols[indx]) |
3425: { |
3426: diag_data[j] = values[indx]; |
[...] |
3433: if (cnt_diag < diag_space) |
3434: { |
3435: diag_j[cnt_diag] = cols[indx]; |
3436: diag_data[cnt_diag++] = values[indx]; |
3437: } |
3438: else |
3439: { |
3440: hypre_error(HYPRE_ERROR_GENERIC); |
3441: #ifdef HYPRE_USING_OPENMP |
3442: #pragma omp atomic |
3443: #endif |
3444: error_flag++; |
3445: if (print_level) |
[...] |
3454: indx++; |
3455: } |
3456: |
3457: hypre_AuxParCSRMatrixIndxDiag(aux_matrix)[row_local] = cnt_diag; |
3458: hypre_AuxParCSRMatrixIndxOffd(aux_matrix)[row_local] = cnt_offd; |
[...] |
3466: indx += n; |
3467: if (aux_matrix) |
3468: { |
3469: col_indx = 0; |
3470: for (i=0; i < off_proc_i_indx; i=i+2) |
3471: { |
3472: row_len = off_proc_i[i+1]; |
3473: if (off_proc_i[i] == row) |
3474: { |
3475: for (j=0; j < n; j++) |
3476: { |
3477: cnt1 = col_indx; |
3478: for (k=0; k < row_len; k++) |
3479: { |
3480: if (off_proc_j[cnt1] == cols[j]) |
3481: { |
3482: off_proc_j[cnt1++] = -1; |
3483: /*cancel_indx++;*/ |
3484: offproc_cnt[my_thread_num]++; |
0x4e3190 PUSH %RBP |
0x4e3191 MOV %RSP,%RBP |
0x4e3194 PUSH %R15 |
0x4e3196 PUSH %R14 |
0x4e3198 PUSH %R13 |
0x4e319a PUSH %R12 |
0x4e319c PUSH %RBX |
0x4e319d SUB $0x78,%RSP |
0x4e31a1 MOV %R9,%RBX |
0x4e31a4 MOV %R8,-0x78(%RBP) |
0x4e31a8 MOV %RCX,-0x30(%RBP) |
0x4e31ac MOV %RDX,%R14 |
0x4e31af MOV %RDI,%R13 |
0x4e31b2 CALL 4f9c80 <hypre_NumActiveThreads> |
0x4e31b7 MOV %RAX,%R15 |
0x4e31ba CALL 4f9c90 <hypre_GetThreadNum> |
0x4e31bf MOV %RAX,%R12 |
0x4e31c2 MOV %R15,%RAX |
0x4e31c5 OR %R14,%RAX |
0x4e31c8 SHR $0x20,%RAX |
0x4e31cc JE 4e320c |
0x4e31ce MOV %R14,%RAX |
0x4e31d1 CQTO |
0x4e31d3 IDIV %R15 |
0x4e31d6 MOV 0xb8(%RBP),%R14 |
0x4e31dd LEA 0x1(%R12),%RCX |
0x4e31e2 CMP %RDX,%R12 |
0x4e31e5 JGE 4e3225 |
0x4e31e7 LEA 0x1(%RAX),%RSI |
0x4e31eb MOV %RSI,%R8 |
0x4e31ee IMUL %R12,%R8 |
0x4e31f2 IMUL %RCX,%RSI |
0x4e31f6 MOVQ $0,(%R14,%R12,8) |
0x4e31fe CMP %RSI,%R8 |
0x4e3201 MOV %RSI,-0x58(%RBP) |
0x4e3205 JL 4e324e |
0x4e3207 JMP 4e3334 |
0x4e320c MOV %R14D,%EAX |
0x4e320f XOR %EDX,%EDX |
0x4e3211 DIV %R15D |
0x4e3214 MOV 0xb8(%RBP),%R14 |
0x4e321b LEA 0x1(%R12),%RCX |
0x4e3220 CMP %RDX,%R12 |
0x4e3223 JL 4e31e7 |
0x4e3225 MOV %RAX,%R8 |
0x4e3228 IMUL %R12,%R8 |
0x4e322c ADD %RDX,%R8 |
0x4e322f IMUL %RAX,%RCX |
0x4e3233 ADD %RDX,%RCX |
0x4e3236 MOV %RCX,%RSI |
0x4e3239 MOVQ $0,(%R14,%R12,8) |
0x4e3241 CMP %RSI,%R8 |
0x4e3244 MOV %RSI,-0x58(%RBP) |
0x4e3248 JGE 4e3334 |
0x4e324e CMP %RDX,%R12 |
0x4e3251 CMOVL %R12,%RDX |
0x4e3255 IMUL %R12,%RAX |
0x4e3259 ADD %RDX,%RAX |
0x4e325c MOV %RSI,%RDX |
0x4e325f SUB %RAX,%RDX |
0x4e3262 CMP $0x8,%RDX |
0x4e3266 JAE 4e326c |
0x4e3268 XOR %ECX,%ECX |
0x4e326a JMP 4e32b8 |
0x4e326c MOV %RDX,%RSI |
0x4e326f SHR $0x3,%RSI |
0x4e3273 MOV -0x30(%RBP),%RCX |
0x4e3277 LEA (%RCX,%R8,8),%RDI |
0x4e327b ADD $0x38,%RDI |
0x4e327f XOR %ECX,%ECX |
0x4e3281 NOPW %CS:(%RAX,%RAX,1) |
(3347) 0x4e3290 ADD -0x38(%RDI),%RCX |
(3347) 0x4e3294 ADD -0x30(%RDI),%RCX |
(3347) 0x4e3298 ADD -0x28(%RDI),%RCX |
(3347) 0x4e329c ADD -0x20(%RDI),%RCX |
(3347) 0x4e32a0 ADD -0x18(%RDI),%RCX |
(3347) 0x4e32a4 ADD -0x10(%RDI),%RCX |
(3347) 0x4e32a8 ADD -0x8(%RDI),%RCX |
(3347) 0x4e32ac ADD (%RDI),%RCX |
(3347) 0x4e32af ADD $0x40,%RDI |
(3347) 0x4e32b3 DEC %RSI |
(3347) 0x4e32b6 JNE 4e3290 |
0x4e32b8 MOV %EDX,%ESI |
0x4e32ba AND $0x7,%ESI |
0x4e32bd DEC %RSI |
0x4e32c0 CMP $0x6,%RSI |
0x4e32c4 JA 4e3330 |
0x4e32c6 AND $-0x8,%RDX |
0x4e32ca JMP 0x527d78(,%RSI,8) |
0x4e32d1 ADD %RDX,%RAX |
0x4e32d4 MOV -0x30(%RBP),%RDX |
0x4e32d8 JMP 4e332c |
0x4e32da ADD %RDX,%RAX |
0x4e32dd MOV -0x30(%RBP),%RDX |
0x4e32e1 JMP 4e3327 |
0x4e32e3 ADD %RDX,%RAX |
0x4e32e6 MOV -0x30(%RBP),%RDX |
0x4e32ea JMP 4e3322 |
0x4e32ec ADD %RDX,%RAX |
0x4e32ef MOV -0x30(%RBP),%RDX |
0x4e32f3 JMP 4e331d |
0x4e32f5 ADD %RDX,%RAX |
0x4e32f8 MOV -0x30(%RBP),%RDX |
0x4e32fc JMP 4e3318 |
0x4e32fe ADD %RDX,%RAX |
0x4e3301 MOV -0x30(%RBP),%RDX |
0x4e3305 JMP 4e3313 |
0x4e3307 ADD %RDX,%RAX |
0x4e330a MOV -0x30(%RBP),%RDX |
0x4e330e ADD 0x30(%RDX,%RAX,8),%RCX |
0x4e3313 ADD 0x28(%RDX,%RAX,8),%RCX |
0x4e3318 ADD 0x20(%RDX,%RAX,8),%RCX |
0x4e331d ADD 0x18(%RDX,%RAX,8),%RCX |
0x4e3322 ADD 0x10(%RDX,%RAX,8),%RCX |
0x4e3327 ADD 0x8(%RDX,%RAX,8),%RCX |
0x4e332c ADD (%RDX,%RAX,8),%RCX |
0x4e3330 MOV %RCX,(%R14,%R12,8) |
0x4e3334 MOV %R8,%R15 |
0x4e3337 MOV (%R13),%ESI |
0x4e333b MOV $0x74d570,%EDI |
0x4e3340 CALL 410130 <__kmpc_barrier@plt> |
0x4e3345 TEST %R12,%R12 |
0x4e3348 JNE 4e33f2 |
0x4e334e MOV 0xc8(%RBP),%RAX |
0x4e3355 TEST %RAX,%RAX |
0x4e3358 JLE 4e33f2 |
0x4e335e CMP $0x8,%RAX |
0x4e3362 JB 4e33c7 |
0x4e3364 MOV %RAX,%RCX |
0x4e3367 SHR $0x3,%RCX |
0x4e336b MOV (%R14),%RDX |
0x4e336e LEA 0x40(%R14),%RSI |
0x4e3372 NOPW %CS:(%RAX,%RAX,1) |
(3346) 0x4e3380 ADD -0x38(%RSI),%RDX |
(3346) 0x4e3384 MOV %RDX,-0x38(%RSI) |
(3346) 0x4e3388 ADD -0x30(%RSI),%RDX |
(3346) 0x4e338c MOV %RDX,-0x30(%RSI) |
(3346) 0x4e3390 ADD -0x28(%RSI),%RDX |
(3346) 0x4e3394 MOV %RDX,-0x28(%RSI) |
(3346) 0x4e3398 ADD -0x20(%RSI),%RDX |
(3346) 0x4e339c MOV %RDX,-0x20(%RSI) |
(3346) 0x4e33a0 ADD -0x18(%RSI),%RDX |
(3346) 0x4e33a4 MOV %RDX,-0x18(%RSI) |
(3346) 0x4e33a8 ADD -0x10(%RSI),%RDX |
(3346) 0x4e33ac MOV %RDX,-0x10(%RSI) |
(3346) 0x4e33b0 ADD -0x8(%RSI),%RDX |
(3346) 0x4e33b4 MOV %RDX,-0x8(%RSI) |
(3346) 0x4e33b8 ADD (%RSI),%RDX |
(3346) 0x4e33bb MOV %RDX,(%RSI) |
(3346) 0x4e33be ADD $0x40,%RSI |
(3346) 0x4e33c2 DEC %RCX |
(3346) 0x4e33c5 JNE 4e3380 |
0x4e33c7 MOV %RAX,%RCX |
0x4e33ca AND $-0x8,%RCX |
0x4e33ce CMP %RAX,%RCX |
0x4e33d1 JAE 4e33f2 |
0x4e33d3 MOV (%R14,%RCX,8),%RDX |
0x4e33d7 NOPW (%RAX,%RAX,1) |
(3345) 0x4e33e0 ADD 0x8(%R14,%RCX,8),%RDX |
(3345) 0x4e33e5 MOV %RDX,0x8(%R14,%RCX,8) |
(3345) 0x4e33ea INC %RCX |
(3345) 0x4e33ed CMP %RCX,%RAX |
(3345) 0x4e33f0 JNE 4e33e0 |
0x4e33f2 MOV (%R13),%ESI |
0x4e33f6 MOV $0x74d590,%EDI |
0x4e33fb CALL 410130 <__kmpc_barrier@plt> |
0x4e3400 TEST %R12,%R12 |
0x4e3403 JE 4e340c |
0x4e3405 MOV -0x8(%R14,%R12,8),%R9 |
0x4e340a JMP 4e340f |
0x4e340c XOR %R9D,%R9D |
0x4e340f MOV -0x78(%RBP),%R14 |
0x4e3413 MOV -0x30(%RBP),%RDX |
0x4e3417 MOV %R15,%RSI |
0x4e341a MOV -0x58(%RBP),%RDI |
0x4e341e CMP %RDI,%R15 |
0x4e3421 JGE 4e3bcb |
0x4e3427 MOV 0xb0(%RBP),%RAX |
0x4e342e MOV 0xa8(%RBP),%RCX |
0x4e3435 MOV 0x98(%RBP),%R8 |
0x4e343c CMPQ $0,0x18(%RBP) |
0x4e3441 LEA (%RAX,%R12,8),%R13 |
0x4e3445 SETE %AL |
0x4e3448 TEST %R8,%R8 |
0x4e344b SETLE %R10B |
0x4e344f OR %AL,%R10B |
0x4e3452 MOV %R10B,-0x31(%RBP) |
0x4e3456 DEC %R8 |
0x4e3459 SHR $0x1,%R8 |
0x4e345c MOV %R8,-0xa0(%RBP) |
0x4e3463 MOV 0x20(%RBP),%R8 |
0x4e3467 LEA 0x18(%RCX),%RAX |
0x4e346b MOV %RAX,-0x90(%RBP) |
0x4e3472 MOVQ $0,-0x68(%RBP) |
0x4e347a JMP 4e34a4 |
0x4e347c NOPL (%RAX) |
(3331) 0x4e3480 MOV -0x78(%RBP),%R14 |
(3331) 0x4e3484 MOV -0x30(%RBP),%RDX |
(3331) 0x4e3488 MOV -0x60(%RBP),%RSI |
(3331) 0x4e348c MOV -0x58(%RBP),%RDI |
(3331) 0x4e3490 MOV -0x70(%RBP),%R9 |
(3331) 0x4e3494 MOV 0x20(%RBP),%R8 |
(3331) 0x4e3498 INC %RSI |
(3331) 0x4e349b CMP %RDI,%RSI |
(3331) 0x4e349e JGE 4e3bcb |
(3331) 0x4e34a4 MOV (%R14,%RSI,8),%R11 |
(3331) 0x4e34a8 MOV (%RDX,%RSI,8),%R15 |
(3331) 0x4e34ac MOV %R11,-0x50(%RBP) |
(3331) 0x4e34b0 SUB (%R8),%R11 |
(3331) 0x4e34b3 JL 4e3570 |
(3331) 0x4e34b9 MOV -0x50(%RBP),%RAX |
(3331) 0x4e34bd CMP 0x8(%R8),%RAX |
(3331) 0x4e34c1 JGE 4e3570 |
(3331) 0x4e34c7 CMPQ $0,0x58(%RBP) |
(3331) 0x4e34cc MOV %R11,-0x40(%RBP) |
(3331) 0x4e34d0 JE 4e372a |
(3331) 0x4e34d6 MOV 0x38(%RBP),%RAX |
(3331) 0x4e34da MOV (%RAX,%R11,8),%R12 |
(3331) 0x4e34de MOV 0x40(%RBP),%RAX |
(3331) 0x4e34e2 MOV (%RAX,%R11,8),%RAX |
(3331) 0x4e34e6 MOV %RAX,-0x88(%RBP) |
(3331) 0x4e34ed MOV 0x50(%RBP),%RAX |
(3331) 0x4e34f1 MOV (%RAX,%R11,8),%RCX |
(3331) 0x4e34f5 MOV 0x48(%RBP),%RAX |
(3331) 0x4e34f9 MOV (%RAX,%R11,8),%R14 |
(3331) 0x4e34fd MOV %RCX,-0x98(%RBP) |
(3331) 0x4e3504 MOV %RCX,%RAX |
(3331) 0x4e3507 SUB %R14,%RAX |
(3331) 0x4e350a MOV %R15,%RCX |
(3331) 0x4e350d SUB %RAX,%RCX |
(3331) 0x4e3510 MOV %RSI,-0x60(%RBP) |
(3331) 0x4e3514 JLE 4e388a |
(3331) 0x4e351a MOV $0x8,%ESI |
(3331) 0x4e351f MOV %RCX,%RDI |
(3331) 0x4e3522 MOV %RCX,-0x50(%RBP) |
(3331) 0x4e3526 MOV %R9,-0x70(%RBP) |
(3331) 0x4e352a CALL 4f7e60 <hypre_CAlloc> |
(3331) 0x4e352f MOV %RAX,-0x80(%RBP) |
(3331) 0x4e3533 MOV $0x8,%ESI |
(3331) 0x4e3538 MOV -0x50(%RBP),%RDI |
(3331) 0x4e353c CALL 4f7e60 <hypre_CAlloc> |
(3331) 0x4e3541 MOV -0x80(%RBP),%R10 |
(3331) 0x4e3545 MOV -0x40(%RBP),%R11 |
(3331) 0x4e3549 MOV -0x70(%RBP),%R9 |
(3331) 0x4e354d MOV 0x10(%RBP),%RDI |
(3331) 0x4e3551 TEST %R15,%R15 |
(3331) 0x4e3554 MOV %RAX,%RCX |
(3331) 0x4e3557 MOV %RAX,-0x68(%RBP) |
(3331) 0x4e355b JG 4e38a5 |
(3331) 0x4e3561 MOV 0x48(%RBP),%RAX |
(3331) 0x4e3565 MOV %R14,(%RAX,%R11,8) |
(3331) 0x4e3569 JMP 4e3a7d |
0x4e356e XCHG %AX,%AX |
(3331) 0x4e3570 ADD %R15,%R9 |
(3331) 0x4e3573 CMPB $0,-0x31(%RBP) |
(3331) 0x4e3577 JNE 4e3498 |
(3331) 0x4e357d TEST %R15,%R15 |
(3331) 0x4e3580 JLE 4e3498 |
(3331) 0x4e3586 MOV %R9,-0x70(%RBP) |
(3331) 0x4e358a MOV %RSI,-0x60(%RBP) |
(3331) 0x4e358e DEC %R15 |
(3331) 0x4e3591 XOR %ECX,%ECX |
(3331) 0x4e3593 XOR %EAX,%EAX |
(3331) 0x4e3595 JMP 4e35b1 |
0x4e3597 NOPW (%RAX,%RAX,1) |
(3332) 0x4e35a0 CMP -0xa0(%RBP),%RAX |
(3332) 0x4e35a7 LEA 0x1(%RAX),%RAX |
(3332) 0x4e35ab JE 4e3480 |
(3332) 0x4e35b1 MOV %RCX,%R9 |
(3332) 0x4e35b4 MOV %RAX,%RSI |
(3332) 0x4e35b7 SAL $0x4,%RSI |
(3332) 0x4e35bb MOV 0xa0(%RBP),%RDI |
(3332) 0x4e35c2 MOV 0x8(%RDI,%RSI,1),%RDX |
(3332) 0x4e35c7 ADD %RDX,%RCX |
(3332) 0x4e35ca MOV -0x50(%RBP),%R8 |
(3332) 0x4e35ce CMP %R8,(%RDI,%RSI,1) |
(3332) 0x4e35d2 JNE 4e35a0 |
(3332) 0x4e35d4 TEST %RDX,%RDX |
(3332) 0x4e35d7 JLE 4e35a0 |
(3332) 0x4e35d9 MOV 0xa8(%RBP),%RSI |
(3332) 0x4e35e0 LEA (%RSI,%RCX,8),%RDI |
(3332) 0x4e35e4 ADD $-0x8,%RDI |
(3332) 0x4e35e8 LEA (%RSI,%R9,8),%RSI |
(3332) 0x4e35ec CMP %R13,%RDI |
(3332) 0x4e35ef JB 4e3640 |
(3332) 0x4e35f1 CMP %RSI,%R13 |
(3332) 0x4e35f4 JB 4e3640 |
(3332) 0x4e35f6 XOR %EDI,%EDI |
(3332) 0x4e35f8 JMP 4e3609 |
0x4e35fa NOPW (%RAX,%RAX,1) |
(3336) 0x4e3600 CMP %R15,%RDI |
(3336) 0x4e3603 LEA 0x1(%RDI),%RDI |
(3336) 0x4e3607 JE 4e35a0 |
(3336) 0x4e3609 MOV (%RBX,%RDI,8),%R8 |
(3336) 0x4e360d XOR %R9D,%R9D |
(3336) 0x4e3610 JMP 4e3628 |
0x4e3612 NOPW %CS:(%RAX,%RAX,1) |
(3337) 0x4e3620 INC %R9 |
(3337) 0x4e3623 CMP %R9,%RDX |
(3337) 0x4e3626 JE 4e3600 |
(3337) 0x4e3628 CMP %R8,(%RSI,%R9,8) |
(3337) 0x4e362c JNE 4e3620 |
(3337) 0x4e362e MOVQ $-0x1,(%RSI,%R9,8) |
(3337) 0x4e3636 INCQ (%R13) |
(3337) 0x4e363a JMP 4e3620 |
0x4e363c NOPL (%RAX) |
(3332) 0x4e3640 MOV %RDX,%RDI |
(3332) 0x4e3643 SHR $0x2,%RDI |
(3332) 0x4e3647 MOV %RDX,%R8 |
(3332) 0x4e364a AND $-0x4,%R8 |
(3332) 0x4e364e MOV -0x90(%RBP),%R10 |
(3332) 0x4e3655 LEA (%R10,%R9,8),%R14 |
(3332) 0x4e3659 XOR %R10D,%R10D |
(3332) 0x4e365c JMP 4e366d |
0x4e365e XCHG %AX,%AX |
(3333) 0x4e3660 CMP %R15,%R10 |
(3333) 0x4e3663 LEA 0x1(%R10),%R10 |
(3333) 0x4e3667 JE 4e35a0 |
(3333) 0x4e366d MOV (%RBX,%R10,8),%R11 |
(3333) 0x4e3671 CMP $0x4,%RDX |
(3333) 0x4e3675 JAE 4e36b0 |
(3333) 0x4e3677 CMP %RDX,%R8 |
(3333) 0x4e367a JAE 4e3660 |
(3333) 0x4e367c MOV %R8,%R9 |
(3333) 0x4e367f JMP 4e3698 |
0x4e3681 NOPW %CS:(%RAX,%RAX,1) |
(3334) 0x4e3690 INC %R9 |
(3334) 0x4e3693 CMP %R9,%RDX |
(3334) 0x4e3696 JE 4e3660 |
(3334) 0x4e3698 CMP %R11,(%RSI,%R9,8) |
(3334) 0x4e369c JNE 4e3690 |
(3334) 0x4e369e MOVQ $-0x1,(%RSI,%R9,8) |
(3334) 0x4e36a6 INCQ (%R13) |
(3334) 0x4e36aa JMP 4e3690 |
0x4e36ac NOPL (%RAX) |
(3333) 0x4e36b0 MOV %RDI,%R12 |
(3333) 0x4e36b3 MOV %R14,%R9 |
(3333) 0x4e36b6 JMP 4e36c9 |
0x4e36b8 NOPL (%RAX,%RAX,1) |
(3335) 0x4e36c0 ADD $0x20,%R9 |
(3335) 0x4e36c4 DEC %R12 |
(3335) 0x4e36c7 JE 4e3677 |
(3335) 0x4e36c9 CMP %R11,-0x18(%R9) |
(3335) 0x4e36cd JNE 4e3700 |
(3335) 0x4e36cf MOVQ $-0x1,-0x18(%R9) |
(3335) 0x4e36d7 INCQ (%R13) |
(3335) 0x4e36db CMP %R11,-0x10(%R9) |
(3335) 0x4e36df JE 4e3706 |
(3335) 0x4e36e1 CMP %R11,-0x8(%R9) |
(3335) 0x4e36e5 JNE 4e3718 |
(3335) 0x4e36e7 MOVQ $-0x1,-0x8(%R9) |
(3335) 0x4e36ef INCQ (%R13) |
(3335) 0x4e36f3 CMP %R11,(%R9) |
(3335) 0x4e36f6 JNE 4e36c0 |
(3335) 0x4e36f8 JMP 4e371d |
0x4e36fa NOPW (%RAX,%RAX,1) |
(3335) 0x4e3700 CMP %R11,-0x10(%R9) |
(3335) 0x4e3704 JNE 4e36e1 |
(3335) 0x4e3706 MOVQ $-0x1,-0x10(%R9) |
(3335) 0x4e370e INCQ (%R13) |
(3335) 0x4e3712 CMP %R11,-0x8(%R9) |
(3335) 0x4e3716 JE 4e36e7 |
(3335) 0x4e3718 CMP %R11,(%R9) |
(3335) 0x4e371b JNE 4e36c0 |
(3335) 0x4e371d MOVQ $-0x1,(%R9) |
(3335) 0x4e3724 INCQ (%R13) |
(3335) 0x4e3728 JMP 4e36c0 |
(3331) 0x4e372a MOV 0x18(%RBP),%RAX |
(3331) 0x4e372e MOV 0x38(%RAX),%RCX |
(3331) 0x4e3732 MOV 0x40(%RAX),%RAX |
(3331) 0x4e3736 MOV (%RAX,%R11,8),%RAX |
(3331) 0x4e373a MOV (%RCX,%R11,8),%RCX |
(3331) 0x4e373e TEST %R15,%R15 |
(3331) 0x4e3741 JLE 4e3a52 |
(3331) 0x4e3747 MOV %RSI,-0x60(%RBP) |
(3331) 0x4e374b MOV 0x60(%RBP),%RDX |
(3331) 0x4e374f MOV 0x8(%RDX,%R11,8),%RDX |
(3331) 0x4e3754 MOV 0x78(%RBP),%RSI |
(3331) 0x4e3758 MOV 0x8(%RSI,%R11,8),%RSI |
(3331) 0x4e375d XOR %EDI,%EDI |
(3331) 0x4e375f MOV %RAX,%R14 |
(3331) 0x4e3762 MOV %RCX,-0x48(%RBP) |
(3331) 0x4e3766 LEA (%R9,%R15,1),%R8 |
(3331) 0x4e376a JMP 4e3796 |
(3338) 0x4e376c MOV %R12,%R9 |
(3338) 0x4e376f MOV 0x10(%RBP),%R11 |
(3338) 0x4e3773 VMOVSD (%R11,%R12,8),%XMM0 |
(3338) 0x4e3779 MOV 0x70(%RBP),%R11 |
(3338) 0x4e377d VMOVSD %XMM0,(%R11,%R10,8) |
(3338) 0x4e3783 MOV -0x40(%RBP),%R11 |
(3338) 0x4e3787 INC %R9 |
(3338) 0x4e378a INC %RDI |
(3338) 0x4e378d CMP %R15,%RDI |
(3338) 0x4e3790 JE 4e3a5d |
(3338) 0x4e3796 MOV %R9,%R12 |
(3338) 0x4e3799 MOV (%RBX,%R9,8),%R9 |
(3338) 0x4e379d CMP 0x28(%RBP),%R9 |
(3338) 0x4e37a1 JL 4e3810 |
(3338) 0x4e37a3 CMP 0x30(%RBP),%R9 |
(3338) 0x4e37a7 JG 4e3810 |
(3338) 0x4e37a9 MOV 0x60(%RBP),%R10 |
(3338) 0x4e37ad MOV (%R10,%R11,8),%R10 |
(3338) 0x4e37b1 CMP %RCX,%R10 |
(3338) 0x4e37b4 JGE 4e37d2 |
(3338) 0x4e37b6 NOPW %CS:(%RAX,%RAX,1) |
(3340) 0x4e37c0 MOV 0x68(%RBP),%R11 |
(3340) 0x4e37c4 CMP %R9,(%R11,%R10,8) |
(3340) 0x4e37c8 JE 4e376c |
(3340) 0x4e37ca INC %R10 |
(3340) 0x4e37cd CMP %R10,%RCX |
(3340) 0x4e37d0 JNE 4e37c0 |
(3338) 0x4e37d2 MOV -0x48(%RBP),%R11 |
(3338) 0x4e37d6 CMP %RDX,%R11 |
(3338) 0x4e37d9 JGE 4e3ac0 |
(3338) 0x4e37df MOV 0x68(%RBP),%R10 |
(3338) 0x4e37e3 MOV %R9,(%R10,%R11,8) |
(3338) 0x4e37e7 MOV %R12,%R9 |
(3338) 0x4e37ea MOV 0x10(%RBP),%R10 |
(3338) 0x4e37ee VMOVSD (%R10,%R12,8),%XMM0 |
(3338) 0x4e37f4 MOV 0x70(%RBP),%R10 |
(3338) 0x4e37f8 VMOVSD %XMM0,(%R10,%R11,8) |
(3338) 0x4e37fe INC %R11 |
(3338) 0x4e3801 MOV %R11,-0x48(%RBP) |
(3338) 0x4e3805 JMP 4e3783 |
0x4e380a NOPW (%RAX,%RAX,1) |
(3338) 0x4e3810 MOV 0x78(%RBP),%R10 |
(3338) 0x4e3814 MOV (%R10,%R11,8),%R10 |
(3338) 0x4e3818 CMP %RAX,%R10 |
(3338) 0x4e381b JGE 4e3835 |
(3338) 0x4e381d NOPL (%RAX) |
(3339) 0x4e3820 MOV 0x80(%RBP),%R11 |
(3339) 0x4e3827 CMP %R9,(%R11,%R10,8) |
(3339) 0x4e382b JE 4e3871 |
(3339) 0x4e382d INC %R10 |
(3339) 0x4e3830 CMP %R10,%RAX |
(3339) 0x4e3833 JNE 4e3820 |
(3338) 0x4e3835 CMP %RSI,%R14 |
(3338) 0x4e3838 JGE 4e3af6 |
(3338) 0x4e383e MOV %R14,%R11 |
(3338) 0x4e3841 MOV 0x80(%RBP),%R10 |
(3338) 0x4e3848 MOV %R9,(%R10,%R14,8) |
(3338) 0x4e384c MOV %R12,%R9 |
(3338) 0x4e384f MOV 0x10(%RBP),%R10 |
(3338) 0x4e3853 VMOVSD (%R10,%R12,8),%XMM0 |
(3338) 0x4e3859 MOV 0x88(%RBP),%R10 |
(3338) 0x4e3860 VMOVSD %XMM0,(%R10,%R14,8) |
(3338) 0x4e3866 INC %R11 |
(3338) 0x4e3869 MOV %R11,%R14 |
(3338) 0x4e386c JMP 4e3783 |
(3338) 0x4e3871 MOV %R12,%R9 |
(3338) 0x4e3874 MOV 0x10(%RBP),%R11 |
(3338) 0x4e3878 VMOVSD (%R11,%R12,8),%XMM0 |
(3338) 0x4e387e MOV 0x88(%RBP),%R11 |
(3338) 0x4e3885 JMP 4e377d |
(3331) 0x4e388a XOR %R10D,%R10D |
(3331) 0x4e388d MOV 0x10(%RBP),%RDI |
(3331) 0x4e3891 MOV -0x68(%RBP),%RAX |
(3331) 0x4e3895 TEST %R15,%R15 |
(3331) 0x4e3898 MOV %RAX,%RCX |
(3331) 0x4e389b MOV %RAX,-0x68(%RBP) |
(3331) 0x4e389f JLE 4e3561 |
(3331) 0x4e38a5 XOR %R8D,%R8D |
(3331) 0x4e38a8 MOV %R14,-0x50(%RBP) |
(3331) 0x4e38ac MOV %R9,%RCX |
(3331) 0x4e38af MOVQ $0,-0x48(%RBP) |
(3331) 0x4e38b7 JMP 4e38df |
0x4e38b9 NOPL (%RAX) |
(3343) 0x4e38c0 MOV -0x48(%RBP),%RSI |
(3343) 0x4e38c4 MOV %RDX,(%R10,%RSI,8) |
(3343) 0x4e38c8 VMOVSD %XMM0,(%RAX,%RSI,8) |
(3343) 0x4e38cd INC %RSI |
(3343) 0x4e38d0 MOV %RSI,-0x48(%RBP) |
(3343) 0x4e38d4 INC %RCX |
(3343) 0x4e38d7 INC %R8 |
(3343) 0x4e38da CMP %R15,%R8 |
(3343) 0x4e38dd JE 4e3943 |
(3343) 0x4e38df MOV (%RBX,%RCX,8),%RDX |
(3343) 0x4e38e3 TEST %R14,%R14 |
(3343) 0x4e38e6 JLE 4e38fe |
(3343) 0x4e38e8 XOR %ESI,%ESI |
(3343) 0x4e38ea NOPW (%RAX,%RAX,1) |
(3344) 0x4e38f0 CMP %RDX,(%R12,%RSI,8) |
(3344) 0x4e38f4 JE 4e3930 |
(3344) 0x4e38f6 INC %RSI |
(3344) 0x4e38f9 CMP %RSI,%R14 |
(3344) 0x4e38fc JNE 4e38f0 |
(3343) 0x4e38fe VMOVSD (%RDI,%RCX,8),%XMM0 |
(3343) 0x4e3903 MOV -0x50(%RBP),%RSI |
(3343) 0x4e3907 CMP -0x98(%RBP),%RSI |
(3343) 0x4e390e JGE 4e38c0 |
(3343) 0x4e3910 MOV %RDX,(%R12,%RSI,8) |
(3343) 0x4e3914 MOV -0x88(%RBP),%RDX |
(3343) 0x4e391b VMOVSD %XMM0,(%RDX,%RSI,8) |
(3343) 0x4e3920 INC %RSI |
(3343) 0x4e3923 MOV %RSI,-0x50(%RBP) |
(3343) 0x4e3927 JMP 4e38d4 |
0x4e3929 NOPL (%RAX) |
(3343) 0x4e3930 VMOVSD (%RDI,%RCX,8),%XMM0 |
(3343) 0x4e3935 MOV -0x88(%RBP),%RDX |
(3343) 0x4e393c VMOVSD %XMM0,(%RDX,%RSI,8) |
(3343) 0x4e3941 JMP 4e38d4 |
(3331) 0x4e3943 ADD %R15,%R9 |
(3331) 0x4e3946 MOV -0x48(%RBP),%RCX |
(3331) 0x4e394a MOV -0x50(%RBP),%RAX |
(3331) 0x4e394e LEA (%RAX,%RCX,1),%R14 |
(3331) 0x4e3952 MOV 0x48(%RBP),%RAX |
(3331) 0x4e3956 MOV %R14,(%RAX,%R11,8) |
(3331) 0x4e395a TEST %RCX,%RCX |
(3331) 0x4e395d JE 4e3a7d |
(3331) 0x4e3963 MOV %R10,-0x80(%RBP) |
(3331) 0x4e3967 MOV %R9,-0x70(%RBP) |
(3331) 0x4e396b MOV 0x38(%RBP),%R12 |
(3331) 0x4e396f MOV (%R12,%R11,8),%RDI |
(3331) 0x4e3973 LEA (,%R14,8),%R15 |
(3331) 0x4e397b MOV %R15,%RSI |
(3331) 0x4e397e CALL 4f7ed0 <hypre_ReAlloc> |
(3331) 0x4e3983 MOV -0x40(%RBP),%RCX |
(3331) 0x4e3987 MOV %RAX,(%R12,%RCX,8) |
(3331) 0x4e398b MOV 0x40(%RBP),%R12 |
(3331) 0x4e398f MOV -0x40(%RBP),%RAX |
(3331) 0x4e3993 MOV (%R12,%RAX,8),%RDI |
(3331) 0x4e3997 MOV %R15,%RSI |
(3331) 0x4e399a CALL 4f7ed0 <hypre_ReAlloc> |
(3331) 0x4e399f MOV -0x40(%RBP),%RDX |
(3331) 0x4e39a3 MOV %RAX,(%R12,%RDX,8) |
(3331) 0x4e39a7 MOV -0x48(%RBP),%R12 |
(3331) 0x4e39ab MOV 0x50(%RBP),%RCX |
(3331) 0x4e39af MOV %R14,(%RCX,%RDX,8) |
(3331) 0x4e39b3 TEST %R12,%R12 |
(3331) 0x4e39b6 JLE 4e3a75 |
(3331) 0x4e39bc MOV 0x38(%RBP),%RCX |
(3331) 0x4e39c0 MOV (%RCX,%RDX,8),%RCX |
(3331) 0x4e39c4 MOV -0x80(%RBP),%R10 |
(3331) 0x4e39c8 LEA (%R10,%R12,8),%RDX |
(3331) 0x4e39cc ADD $-0x8,%RDX |
(3331) 0x4e39d0 MOV -0x50(%RBP),%R11 |
(3331) 0x4e39d4 LEA (%RCX,%R11,8),%RDI |
(3331) 0x4e39d8 CMP %RDI,%RDX |
(3331) 0x4e39db SETAE %DL |
(3331) 0x4e39de LEA (%R12,%R11,1),%RSI |
(3331) 0x4e39e2 DEC %RSI |
(3331) 0x4e39e5 LEA (%RCX,%RSI,8),%RCX |
(3331) 0x4e39e9 CMP %R10,%RCX |
(3331) 0x4e39ec SETAE %R8B |
(3331) 0x4e39f0 MOV -0x68(%RBP),%R9 |
(3331) 0x4e39f4 LEA (%R9,%R12,8),%RCX |
(3331) 0x4e39f8 ADD $-0x8,%RCX |
(3331) 0x4e39fc LEA (%RAX,%R11,8),%R15 |
(3331) 0x4e3a00 CMP %R15,%RCX |
(3331) 0x4e3a03 SETB %CL |
(3331) 0x4e3a06 LEA (%RAX,%RSI,8),%RAX |
(3331) 0x4e3a0a CMP %R9,%RAX |
(3331) 0x4e3a0d SETB %AL |
(3331) 0x4e3a10 TEST %R8B,%DL |
(3331) 0x4e3a13 JNE 4e3a8f |
(3331) 0x4e3a15 OR %AL,%CL |
(3331) 0x4e3a17 JE 4e3a8f |
(3331) 0x4e3a19 CMP $0xc,%R12 |
(3331) 0x4e3a1d MOV -0x78(%RBP),%R14 |
(3331) 0x4e3a21 JBE 4e3b6c |
(3331) 0x4e3a27 SAL $0x3,%R12 |
(3331) 0x4e3a2b MOV %R10,%RSI |
(3331) 0x4e3a2e MOV %R12,%RDX |
(3331) 0x4e3a31 CALL 5010d0 <_intel_fast_memcpy> |
(3331) 0x4e3a36 MOV %R15,%RDI |
(3331) 0x4e3a39 MOV -0x68(%RBP),%RSI |
(3331) 0x4e3a3d MOV %R12,%RDX |
(3331) 0x4e3a40 CALL 5010d0 <_intel_fast_memcpy> |
(3331) 0x4e3a45 MOV -0x80(%RBP),%R10 |
(3331) 0x4e3a49 MOV -0x70(%RBP),%R9 |
(3331) 0x4e3a4d JMP 4e3b9b |
(3331) 0x4e3a52 MOV %RCX,%R10 |
(3331) 0x4e3a55 MOV %RAX,%R14 |
(3331) 0x4e3a58 JMP 4e3b4f |
(3331) 0x4e3a5d MOV %R8,%R9 |
(3331) 0x4e3a60 MOV -0x30(%RBP),%RDX |
(3331) 0x4e3a64 MOV -0x60(%RBP),%RSI |
(3331) 0x4e3a68 MOV -0x58(%RBP),%RDI |
(3331) 0x4e3a6c MOV 0x20(%RBP),%R8 |
(3331) 0x4e3a70 JMP 4e3b4b |
(3331) 0x4e3a75 MOV -0x70(%RBP),%R9 |
(3331) 0x4e3a79 MOV -0x80(%RBP),%R10 |
(3331) 0x4e3a7d TEST %R10,%R10 |
(3331) 0x4e3a80 MOV -0x78(%RBP),%R14 |
(3331) 0x4e3a84 JNE 4e3b9b |
(3331) 0x4e3a8a JMP 4e3bba |
(3331) 0x4e3a8f XOR %EAX,%EAX |
(3331) 0x4e3a91 MOV -0x78(%RBP),%R14 |
(3331) 0x4e3a95 MOV -0x70(%RBP),%R9 |
(3331) 0x4e3a99 MOV -0x68(%RBP),%RDX |
(3331) 0x4e3a9d NOPL (%RAX) |
(3341) 0x4e3aa0 MOV (%R10,%RAX,8),%RCX |
(3341) 0x4e3aa4 MOV %RCX,(%RDI,%RAX,8) |
(3341) 0x4e3aa8 VMOVSD (%RDX,%RAX,8),%XMM0 |
(3341) 0x4e3aad VMOVSD %XMM0,(%R15,%RAX,8) |
(3341) 0x4e3ab3 INC %RAX |
(3341) 0x4e3ab6 CMP %RAX,%R12 |
(3341) 0x4e3ab9 JNE 4e3aa0 |
(3331) 0x4e3abb JMP 4e3b9b |
(3331) 0x4e3ac0 MOV -0x50(%RBP),%R15 |
(3331) 0x4e3ac4 MOV $0x528c03,%EDI |
(3331) 0x4e3ac9 MOV $0xd70,%ESI |
(3331) 0x4e3ace MOV $0x1,%EDX |
(3331) 0x4e3ad3 XOR %ECX,%ECX |
(3331) 0x4e3ad5 CALL 4faac0 <hypre_error_handler> |
(3331) 0x4e3ada MOV 0xd0(%RBP),%RAX |
(3331) 0x4e3ae1 LOCK INCQ (%RAX) |
(3331) 0x4e3ae5 MOV $0x528d85,%EDI |
(3331) 0x4e3aea CMPQ $0,0xc0(%RBP) |
(3331) 0x4e3af2 JNE 4e3b2a |
(3331) 0x4e3af4 JMP 4e3b34 |
(3331) 0x4e3af6 MOV -0x50(%RBP),%R15 |
(3331) 0x4e3afa MOV $0x528c03,%EDI |
(3331) 0x4e3aff MOV $0xd4e,%ESI |
(3331) 0x4e3b04 MOV $0x1,%EDX |
(3331) 0x4e3b09 XOR %ECX,%ECX |
(3331) 0x4e3b0b CALL 4faac0 <hypre_error_handler> |
(3331) 0x4e3b10 MOV 0xd0(%RBP),%RAX |
(3331) 0x4e3b17 LOCK INCQ (%RAX) |
(3331) 0x4e3b1b MOV $0x528d5f,%EDI |
(3331) 0x4e3b20 CMPQ $0,0xc0(%RBP) |
(3331) 0x4e3b28 JE 4e3b34 |
(3331) 0x4e3b2a MOV %R15,%RSI |
(3331) 0x4e3b2d XOR %EAX,%EAX |
(3331) 0x4e3b2f CALL 4f8030 <hypre_printf> |
(3331) 0x4e3b34 MOV -0x30(%RBP),%RDX |
(3331) 0x4e3b38 MOV -0x60(%RBP),%RSI |
(3331) 0x4e3b3c MOV -0x58(%RBP),%RDI |
(3331) 0x4e3b40 MOV %R12,%R9 |
(3331) 0x4e3b43 MOV 0x20(%RBP),%R8 |
(3331) 0x4e3b47 MOV -0x40(%RBP),%R11 |
(3331) 0x4e3b4b MOV -0x48(%RBP),%R10 |
(3331) 0x4e3b4f MOV 0x18(%RBP),%RCX |
(3331) 0x4e3b53 MOV 0x38(%RCX),%RAX |
(3331) 0x4e3b57 MOV %R10,(%RAX,%R11,8) |
(3331) 0x4e3b5b MOV 0x40(%RCX),%RAX |
(3331) 0x4e3b5f MOV %R14,(%RAX,%R11,8) |
(3331) 0x4e3b63 MOV -0x78(%RBP),%R14 |
(3331) 0x4e3b67 JMP 4e3498 |
(3331) 0x4e3b6c XOR %EAX,%EAX |
(3331) 0x4e3b6e MOV -0x70(%RBP),%R9 |
(3331) 0x4e3b72 MOV -0x68(%RBP),%RDX |
(3331) 0x4e3b76 NOPW %CS:(%RAX,%RAX,1) |
(3342) 0x4e3b80 MOV (%R10,%RAX,8),%RCX |
(3342) 0x4e3b84 MOV %RCX,(%RDI,%RAX,8) |
(3342) 0x4e3b88 VMOVSD (%RDX,%RAX,8),%XMM0 |
(3342) 0x4e3b8d VMOVSD %XMM0,(%R15,%RAX,8) |
(3342) 0x4e3b93 INC %RAX |
(3342) 0x4e3b96 CMP %RAX,%R12 |
(3342) 0x4e3b99 JNE 4e3b80 |
(3331) 0x4e3b9b MOV %R10,%RDI |
(3331) 0x4e3b9e MOV %R9,%R15 |
(3331) 0x4e3ba1 CALL 4f7f50 <hypre_Free> |
(3331) 0x4e3ba6 MOV -0x68(%RBP),%RDI |
(3331) 0x4e3baa CALL 4f7f50 <hypre_Free> |
(3331) 0x4e3baf MOV %R15,%R9 |
(3331) 0x4e3bb2 MOVQ $0,-0x68(%RBP) |
(3331) 0x4e3bba MOV -0x30(%RBP),%RDX |
(3331) 0x4e3bbe MOV -0x60(%RBP),%RSI |
(3331) 0x4e3bc2 MOV -0x58(%RBP),%RDI |
(3331) 0x4e3bc6 JMP 4e3494 |
0x4e3bcb ADD $0x78,%RSP |
0x4e3bcf POP %RBX |
0x4e3bd0 POP %R12 |
0x4e3bd2 POP %R13 |
0x4e3bd4 POP %R14 |
0x4e3bd6 POP %R15 |
0x4e3bd8 POP %RBP |
0x4e3bd9 RET |
0x4e3bda NOPW (%RAX,%RAX,1) |
Path / |
Source file and lines | IJMatrix_parcsr.c:3240-3484 |
Module | exec |
nb instructions | 183 |
nb uops | 194 |
loop length | 734 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 33.50 cycles |
front end | 33.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 14.90 | 14.80 | 13.00 | 13.00 | 10.50 | 14.80 | 14.70 | 10.50 | 10.50 | 10.50 | 14.80 | 13.00 |
cycles | 14.90 | 19.00 | 13.00 | 13.00 | 10.50 | 14.80 | 14.70 | 10.50 | 10.50 | 10.50 | 14.80 | 13.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 32.54 |
Stall cycles | 0.00 |
Front-end | 33.50 |
Dispatch | 19.00 |
DIV/SQRT | 16.00 |
Overall L1 | 33.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 11% |
load | 12% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x78,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4f9c80 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4f9c90 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R14,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4e320c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R15 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV 0xb8(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%R12),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4e3225 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x95> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x1(%RAX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R12,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
IMUL %RCX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOVQ $0,(%R14,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RSI,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JL 4e324e <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4e3334 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x1a4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R14D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R15D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV 0xb8(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%R12),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4e31e7 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x57> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R12,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVQ $0,(%R14,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RSI,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4e3334 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x1a4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %R12,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %R12,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP $0x8,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4e326c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xdc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4e32b8 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x128> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RDX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x3,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV -0x30(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RCX,%R8,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x38,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDX,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $0x7,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
DEC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x6,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 4e3330 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x1a0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
AND $-0x8,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JMP 0x527d78(,%RSI,8) | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e332c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x19c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e3327 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x197> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e3322 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x192> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e331d <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x18d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e3318 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x188> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e3313 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x183> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD 0x30(%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
ADD 0x28(%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
ADD 0x20(%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
ADD 0x18(%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
ADD 0x10(%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
ADD 0x8(%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
ADD (%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RCX,(%R14,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%R13),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d570,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410130 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4e33f2 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x262> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4e33f2 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x262> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x8,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4e33c7 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x237> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x3,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R14),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x40(%R14),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x8,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4e33f2 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x262> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R14,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R13),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d590,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410130 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4e340c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x27c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x8(%R14,%R12,8),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e340f <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x27f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x78(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x58(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4e3bcb <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xa3b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x98(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,0x18(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
LEA (%RAX,%R12,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SETE %AL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %R8,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
SETLE %R10B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
OR %AL,%R10B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R10B,-0x31(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x1,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R8,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x18(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4e34a4 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x314> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x78,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | IJMatrix_parcsr.c:3240-3484 |
Module | exec |
nb instructions | 183 |
nb uops | 194 |
loop length | 734 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 0 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 14 |
micro-operation queue | 33.50 cycles |
front end | 33.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 14.90 | 14.80 | 13.00 | 13.00 | 10.50 | 14.80 | 14.70 | 10.50 | 10.50 | 10.50 | 14.80 | 13.00 |
cycles | 14.90 | 19.00 | 13.00 | 13.00 | 10.50 | 14.80 | 14.70 | 10.50 | 10.50 | 10.50 | 14.80 | 13.00 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 32.54 |
Stall cycles | 0.00 |
Front-end | 33.50 |
Dispatch | 19.00 |
DIV/SQRT | 16.00 |
Overall L1 | 33.50 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
all | 11% |
load | 12% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x78,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0x78(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x30(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4f9c80 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4f9c90 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R14,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4e320c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x7c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R14,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R15 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
MOV 0xb8(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%R12),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4e3225 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x95> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x1(%RAX),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R12,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
IMUL %RCX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOVQ $0,(%R14,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RSI,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JL 4e324e <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xbe> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4e3334 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x1a4> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
MOV %R14D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R15D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV 0xb8(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%R12),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 4e31e7 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x57> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R12,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVQ $0,(%R14,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
CMP %RSI,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,-0x58(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4e3334 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x1a4> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RDX,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %R12,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %R12,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP $0x8,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4e326c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xdc> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4e32b8 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x128> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RDX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x3,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV -0x30(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RCX,%R8,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x38,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %ECX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %EDX,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $0x7,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
DEC %RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP $0x6,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JA 4e3330 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x1a0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
AND $-0x8,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JMP 0x527d78(,%RSI,8) | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e332c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x19c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e3327 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x197> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e3322 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x192> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e331d <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x18d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e3318 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x188> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e3313 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x183> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
ADD %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD 0x30(%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
ADD 0x28(%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
ADD 0x20(%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
ADD 0x18(%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
ADD 0x10(%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
ADD 0x8(%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
ADD (%RDX,%RAX,8),%RCX | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %RCX,(%R14,%R12,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%R13),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d570,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410130 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4e33f2 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x262> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4e33f2 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x262> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x8,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4e33c7 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x237> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x3,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R14),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x40(%R14),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x8,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4e33f2 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x262> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R14,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R13),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x74d590,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 410130 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R12,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4e340c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x27c> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x8(%R14,%R12,8),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4e340f <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x27f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x78(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x58(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%R15 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4e3bcb <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xa3b> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x98(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMPQ $0,0x18(%RBP) | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
LEA (%RAX,%R12,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SETE %AL | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %R8,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
SETLE %R10B | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
OR %AL,%R10B | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %R10B,-0x31(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
DEC %R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x1,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %R8,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x18(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0x90(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0,-0x68(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4e34a4 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x314> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x78,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_IJMatrixSetValuesOMPParCSR.extracted.28– | 0.56 | 0.13 |
▼Loop 3331 - IJMatrix_parcsr.c:3262-3484 - exec– | 0.05 | 0.01 |
▼Loop 3338 - IJMatrix_parcsr.c:3383-3454 - exec– | 0.51 | 0.1 |
○Loop 3339 - IJMatrix_parcsr.c:3388-3390 - exec | 0 | 0 |
○Loop 3340 - IJMatrix_parcsr.c:3422-3424 - exec | 0 | 0 |
▼Loop 3343 - IJMatrix_parcsr.c:3316-3341 - exec– | 0 | 0 |
○Loop 3344 - IJMatrix_parcsr.c:3318-3320 - exec | 0 | 0 |
○Loop 3341 - IJMatrix_parcsr.c:3359-3362 - exec | 0 | 0 |
○Loop 3342 - IJMatrix_parcsr.c:3359-3362 - exec | 0 | 0 |
▼Loop 3332 - IJMatrix_parcsr.c:3262-3484 - exec– | 0 | 0 |
▼Loop 3333 - IJMatrix_parcsr.c:3473-3484 - exec– | 0 | 0 |
○Loop 3335 - IJMatrix_parcsr.c:3478-3484 - exec | 0 | 0 |
○Loop 3334 - IJMatrix_parcsr.c:3478-3484 - exec | 0 | 0 |
▼Loop 3336 - IJMatrix_parcsr.c:3475-3484 - exec– | 0 | 0 |
○Loop 3337 - IJMatrix_parcsr.c:3478-3484 - exec | 0 | 0 |
○Loop 3347 - IJMatrix_parcsr.c:3274-3275 - exec | 0.01 | 0 |
○Loop 3346 - IJMatrix_parcsr.c:3282-3283 - exec | 0 | 0 |
○Loop 3345 - IJMatrix_parcsr.c:3282-3283 - exec | 0 | 0 |