Function: hypre_IJMatrixSetValuesOMPParCSR.extracted.28 | Module: exec | Source: IJMatrix_parcsr.c:3240-3484 [...] | Coverage: 0.81% |
---|
Function: hypre_IJMatrixSetValuesOMPParCSR.extracted.28 | Module: exec | Source: IJMatrix_parcsr.c:3240-3484 [...] | Coverage: 0.81% |
---|
/scratch_na/users/xoserete/qaas_runs/171-172-8217/intel/AMG/build/AMG/AMG/IJ_mv/IJMatrix_parcsr.c: 3240 - 3484 |
-------------------------------------------------------------------------------- |
3240: #pragma omp parallel |
[...] |
3256: num_threads = hypre_NumActiveThreads(); |
3257: my_thread_num = hypre_GetThreadNum(); |
3258: |
3259: len = nrows/num_threads; |
3260: rest = nrows - len*num_threads; |
3261: |
3262: if (my_thread_num < rest) |
3263: { |
3264: ns = my_thread_num*(len+1); |
3265: ne = (my_thread_num+1)*(len+1); |
3266: } |
3267: else |
3268: { |
3269: ns = my_thread_num*len+rest; |
3270: ne = (my_thread_num+1)*len+rest; |
3271: } |
3272: |
3273: value_start[my_thread_num] = 0; |
3274: for (ii=ns; ii < ne; ii++) |
3275: value_start[my_thread_num] += ncols[ii]; |
3276: |
3277: #ifdef HYPRE_USING_OPENMP |
3278: #pragma omp barrier |
3279: #endif |
3280: if (my_thread_num == 0) |
3281: { |
3282: for (i=0; i < max_num_threads; i++) |
3283: value_start[i+1] += value_start[i]; |
[...] |
3289: if (my_thread_num) |
3290: indx = value_start[my_thread_num-1]; |
3291: for (ii=ns; ii < ne; ii++) |
3292: { |
3293: row = rows[ii]; |
3294: n = ncols[ii]; |
3295: /* processor owns the row */ |
3296: if (row >= row_partitioning[pstart] && row < row_partitioning[pstart+1]) |
3297: { |
3298: row_local = row - row_partitioning[pstart]; |
3299: /* compute local row number */ |
3300: if (need_aux) |
3301: { |
3302: local_j = aux_j[row_local]; |
3303: local_data = aux_data[row_local]; |
3304: space = row_space[row_local]; |
3305: old_size = row_length[row_local]; |
3306: size = space - old_size; |
3307: if (size < n) |
3308: { |
3309: size = n - size; |
3310: tmp_j = hypre_CTAlloc(HYPRE_Int,size); |
3311: tmp_data = hypre_CTAlloc(HYPRE_Complex,size); |
3312: } |
3313: tmp_indx = 0; |
3314: not_found = 1; |
3315: size = old_size; |
3316: for (i=0; i < n; i++) |
3317: { |
3318: for (j=0; j < old_size; j++) |
3319: { |
3320: if (local_j[j] == cols[indx]) |
3321: { |
3322: local_data[j] = values[indx]; |
[...] |
3329: if (size < space) |
3330: { |
3331: local_j[size] = cols[indx]; |
3332: local_data[size++] = values[indx]; |
3333: } |
3334: else |
3335: { |
3336: tmp_j[tmp_indx] = cols[indx]; |
3337: tmp_data[tmp_indx++] = values[indx]; |
[...] |
3344: row_length[row_local] = size+tmp_indx; |
3345: |
3346: if (tmp_indx) |
3347: { |
3348: aux_j[row_local] = hypre_TReAlloc(aux_j[row_local],HYPRE_Int, |
3349: size+tmp_indx); |
3350: aux_data[row_local] = hypre_TReAlloc(aux_data[row_local], |
3351: HYPRE_Complex,size+tmp_indx); |
3352: row_space[row_local] = size+tmp_indx; |
3353: local_j = aux_j[row_local]; |
[...] |
3359: for (i=0; i < tmp_indx; i++) |
3360: { |
3361: local_j[cnt] = tmp_j[i]; |
3362: local_data[cnt++] = tmp_data[i]; |
3363: } |
3364: |
3365: if (tmp_j) |
3366: { |
3367: hypre_TFree(tmp_j); |
3368: hypre_TFree(tmp_data); |
[...] |
3376: offd_indx = hypre_AuxParCSRMatrixIndxOffd(aux_matrix)[row_local]; |
3377: diag_indx = hypre_AuxParCSRMatrixIndxDiag(aux_matrix)[row_local]; |
3378: cnt_diag = diag_indx; |
3379: cnt_offd = offd_indx; |
3380: diag_space = diag_i[row_local+1]; |
3381: offd_space = offd_i[row_local+1]; |
3382: not_found = 1; |
3383: for (i=0; i < n; i++) |
3384: { |
3385: if (cols[indx] < col_0 || cols[indx] > col_n) |
3386: /* insert into offd */ |
3387: { |
3388: for (j=offd_i[row_local]; j < offd_indx; j++) |
3389: { |
3390: if (offd_j[j] == cols[indx]) |
3391: { |
3392: offd_data[j] = values[indx]; |
[...] |
3399: if (cnt_offd < offd_space) |
3400: { |
3401: offd_j[cnt_offd] = cols[indx]; |
3402: offd_data[cnt_offd++] = values[indx]; |
3403: } |
3404: else |
3405: { |
3406: hypre_error(HYPRE_ERROR_GENERIC); |
3407: #ifdef HYPRE_USING_OPENMP |
3408: #pragma omp atomic |
3409: #endif |
3410: error_flag++; |
[...] |
3422: for (j=diag_i[row_local]; j < diag_indx; j++) |
3423: { |
3424: if (diag_j[j] == cols[indx]) |
3425: { |
3426: diag_data[j] = values[indx]; |
[...] |
3433: if (cnt_diag < diag_space) |
3434: { |
3435: diag_j[cnt_diag] = cols[indx]; |
3436: diag_data[cnt_diag++] = values[indx]; |
3437: } |
3438: else |
3439: { |
3440: hypre_error(HYPRE_ERROR_GENERIC); |
3441: #ifdef HYPRE_USING_OPENMP |
3442: #pragma omp atomic |
3443: #endif |
3444: error_flag++; |
3445: if (print_level) |
[...] |
3454: indx++; |
3455: } |
3456: |
3457: hypre_AuxParCSRMatrixIndxDiag(aux_matrix)[row_local] = cnt_diag; |
3458: hypre_AuxParCSRMatrixIndxOffd(aux_matrix)[row_local] = cnt_offd; |
[...] |
3466: indx += n; |
3467: if (aux_matrix) |
3468: { |
3469: col_indx = 0; |
3470: for (i=0; i < off_proc_i_indx; i=i+2) |
3471: { |
3472: row_len = off_proc_i[i+1]; |
3473: if (off_proc_i[i] == row) |
3474: { |
3475: for (j=0; j < n; j++) |
3476: { |
3477: cnt1 = col_indx; |
3478: for (k=0; k < row_len; k++) |
3479: { |
3480: if (off_proc_j[cnt1] == cols[j]) |
3481: { |
3482: off_proc_j[cnt1++] = -1; |
3483: /*cancel_indx++;*/ |
3484: offproc_cnt[my_thread_num]++; |
0x4c3fd0 PUSH %RBP |
0x4c3fd1 MOV %RSP,%RBP |
0x4c3fd4 PUSH %R15 |
0x4c3fd6 PUSH %R14 |
0x4c3fd8 PUSH %R13 |
0x4c3fda PUSH %R12 |
0x4c3fdc PUSH %RBX |
0x4c3fdd SUB $0x98,%RSP |
0x4c3fe4 MOV %R9,%RBX |
0x4c3fe7 MOV %R8,-0xa8(%RBP) |
0x4c3fee MOV %RCX,-0x38(%RBP) |
0x4c3ff2 MOV %RDX,%R15 |
0x4c3ff5 MOV %RDI,%R12 |
0x4c3ff8 CALL 4d7300 <hypre_NumActiveThreads> |
0x4c3ffd MOV %RAX,%R13 |
0x4c4000 CALL 4d7310 <hypre_GetThreadNum> |
0x4c4005 MOV %RAX,%R14 |
0x4c4008 MOV %R13,%RAX |
0x4c400b OR %R15,%RAX |
0x4c400e SHR $0x20,%RAX |
0x4c4012 JE 4c401e |
0x4c4014 MOV %R15,%RAX |
0x4c4017 CQTO |
0x4c4019 IDIV %R13 |
0x4c401c JMP 4c4026 |
0x4c401e MOV %R15D,%EAX |
0x4c4021 XOR %EDX,%EDX |
0x4c4023 DIV %R13D |
0x4c4026 MOV -0x38(%RBP),%RSI |
0x4c402a MOV %R12,%R13 |
0x4c402d MOV 0xb8(%RBP),%R15 |
0x4c4034 LEA 0x1(%R14),%RCX |
0x4c4038 CMP %RDX,%R14 |
0x4c403b JGE 4c404e |
0x4c403d LEA 0x1(%RAX),%R8 |
0x4c4041 MOV %R8,%RDI |
0x4c4044 IMUL %R14,%RDI |
0x4c4048 IMUL %RCX,%R8 |
0x4c404c JMP 4c4062 |
0x4c404e MOV %RAX,%RDI |
0x4c4051 IMUL %R14,%RDI |
0x4c4055 ADD %RDX,%RDI |
0x4c4058 IMUL %RAX,%RCX |
0x4c405c ADD %RDX,%RCX |
0x4c405f MOV %RCX,%R8 |
0x4c4062 MOVQ $0,(%R15,%R14,8) |
0x4c406a MOV %RDI,%R12 |
0x4c406d CMP %R8,%RDI |
0x4c4070 MOV %R8,-0x40(%RBP) |
0x4c4074 JGE 4c413f |
0x4c407a LEA (%R15,%R14,8),%RCX |
0x4c407e MOV %RSI,%RDI |
0x4c4081 LEA -0x8(%RSI,%R8,8),%R8 |
0x4c4086 CMP %RDX,%R14 |
0x4c4089 CMOVL %R14,%RDX |
0x4c408d IMUL %R14,%RAX |
0x4c4091 LEA (%RDX,%RAX,1),%RSI |
0x4c4095 LEA (%RDI,%RSI,8),%RDI |
0x4c4099 CMP %RCX,%R8 |
0x4c409c JB 4c40c1 |
0x4c409e CMP %RDI,%RCX |
0x4c40a1 JB 4c40c1 |
0x4c40a3 XOR %EAX,%EAX |
0x4c40a5 MOV %R12,%RDX |
0x4c40a8 MOV -0x38(%RBP),%RSI |
0x4c40ac MOV -0x40(%RBP),%RDI |
(3832) 0x4c40b0 ADD (%RSI,%RDX,8),%RAX |
(3832) 0x4c40b4 MOV %RAX,(%RCX) |
(3832) 0x4c40b7 INC %RDX |
(3832) 0x4c40ba CMP %RDX,%RDI |
(3832) 0x4c40bd JNE 4c40b0 |
0x4c40bf JMP 4c413f |
0x4c40c1 MOV -0x40(%RBP),%R8 |
0x4c40c5 SUB %RSI,%R8 |
0x4c40c8 MOV %R8,%RSI |
0x4c40cb AND $-0x4,%RSI |
0x4c40cf JE 4c4116 |
0x4c40d1 LEA -0x1(%RSI),%R9 |
0x4c40d5 VPXOR %XMM0,%XMM0,%XMM0 |
0x4c40d9 XOR %R10D,%R10D |
0x4c40dc NOPL (%RAX) |
(3831) 0x4c40e0 VPADDQ (%RDI,%R10,8),%YMM0,%YMM0 |
(3831) 0x4c40e6 ADD $0x4,%R10 |
(3831) 0x4c40ea CMP %R9,%R10 |
(3831) 0x4c40ed JBE 4c40e0 |
0x4c40ef VEXTRACTI128 $0x1,%YMM0,%XMM1 |
0x4c40f5 VPADDQ %XMM1,%XMM0,%XMM0 |
0x4c40f9 VPSHUFD $-0x12,%XMM0,%XMM1 |
0x4c40fe VPADDQ %XMM1,%XMM0,%XMM0 |
0x4c4102 VMOVQ %XMM0,%RDI |
0x4c4107 CMP %RSI,%R8 |
0x4c410a MOV -0x38(%RBP),%R8 |
0x4c410e MOV -0x40(%RBP),%R9 |
0x4c4112 JNE 4c4122 |
0x4c4114 JMP 4c413c |
0x4c4116 XOR %ESI,%ESI |
0x4c4118 XOR %EDI,%EDI |
0x4c411a MOV -0x38(%RBP),%R8 |
0x4c411e MOV -0x40(%RBP),%R9 |
0x4c4122 ADD %RDX,%RSI |
0x4c4125 ADD %RAX,%RSI |
0x4c4128 NOPL (%RAX,%RAX,1) |
(3830) 0x4c4130 ADD (%R8,%RSI,8),%RDI |
(3830) 0x4c4134 INC %RSI |
(3830) 0x4c4137 CMP %RSI,%R9 |
(3830) 0x4c413a JNE 4c4130 |
0x4c413c MOV %RDI,(%RCX) |
0x4c413f MOV (%R13),%ESI |
0x4c4143 MOV $0x719570,%EDI |
0x4c4148 VZEROUPPER |
0x4c414b CALL 40fed0 <__kmpc_barrier@plt> |
0x4c4150 TEST %R14,%R14 |
0x4c4153 JNE 4c41f4 |
0x4c4159 MOV 0xc8(%RBP),%RAX |
0x4c4160 TEST %RAX,%RAX |
0x4c4163 JLE 4c41f4 |
0x4c4169 CMP $0x8,%RAX |
0x4c416d JB 4c41c7 |
0x4c416f MOV %RAX,%RCX |
0x4c4172 SHR $0x3,%RCX |
0x4c4176 MOV (%R15),%RDX |
0x4c4179 LEA 0x40(%R15),%RSI |
0x4c417d NOPL (%RAX) |
(3829) 0x4c4180 ADD -0x38(%RSI),%RDX |
(3829) 0x4c4184 MOV %RDX,-0x38(%RSI) |
(3829) 0x4c4188 ADD -0x30(%RSI),%RDX |
(3829) 0x4c418c MOV %RDX,-0x30(%RSI) |
(3829) 0x4c4190 ADD -0x28(%RSI),%RDX |
(3829) 0x4c4194 MOV %RDX,-0x28(%RSI) |
(3829) 0x4c4198 ADD -0x20(%RSI),%RDX |
(3829) 0x4c419c MOV %RDX,-0x20(%RSI) |
(3829) 0x4c41a0 ADD -0x18(%RSI),%RDX |
(3829) 0x4c41a4 MOV %RDX,-0x18(%RSI) |
(3829) 0x4c41a8 ADD -0x10(%RSI),%RDX |
(3829) 0x4c41ac MOV %RDX,-0x10(%RSI) |
(3829) 0x4c41b0 ADD -0x8(%RSI),%RDX |
(3829) 0x4c41b4 MOV %RDX,-0x8(%RSI) |
(3829) 0x4c41b8 ADD (%RSI),%RDX |
(3829) 0x4c41bb MOV %RDX,(%RSI) |
(3829) 0x4c41be ADD $0x40,%RSI |
(3829) 0x4c41c2 DEC %RCX |
(3829) 0x4c41c5 JNE 4c4180 |
0x4c41c7 MOV %RAX,%RCX |
0x4c41ca AND $-0x8,%RCX |
0x4c41ce CMP %RAX,%RCX |
0x4c41d1 JAE 4c41f4 |
0x4c41d3 MOV (%R15,%RCX,8),%RDX |
0x4c41d7 NOPW (%RAX,%RAX,1) |
(3828) 0x4c41e0 LEA (%R15,%RCX,8),%RSI |
(3828) 0x4c41e4 INC %RCX |
(3828) 0x4c41e7 ADD 0x8(%RSI),%RDX |
(3828) 0x4c41eb MOV %RDX,0x8(%RSI) |
(3828) 0x4c41ef CMP %RCX,%RAX |
(3828) 0x4c41f2 JNE 4c41e0 |
0x4c41f4 MOV (%R13),%ESI |
0x4c41f8 MOV $0x719590,%EDI |
0x4c41fd CALL 40fed0 <__kmpc_barrier@plt> |
0x4c4202 TEST %R14,%R14 |
0x4c4205 JE 4c4212 |
0x4c4207 MOV -0x8(%R15,%R14,8),%RAX |
0x4c420c MOV %RAX,-0x60(%RBP) |
0x4c4210 JMP 4c421a |
0x4c4212 MOVQ $0,-0x60(%RBP) |
0x4c421a MOV -0x38(%RBP),%RDX |
0x4c421e MOV %R12,%RSI |
0x4c4221 MOV -0x40(%RBP),%RDI |
0x4c4225 CMP %RDI,%R12 |
0x4c4228 JGE 4c4e03 |
0x4c422e MOV 0xb0(%RBP),%RAX |
0x4c4235 MOV 0xa8(%RBP),%RCX |
0x4c423c MOV 0x98(%RBP),%R8 |
0x4c4243 LEA (%RAX,%R14,8),%R15 |
0x4c4247 LEA -0x1(%R8),%RAX |
0x4c424b SHR $0x1,%RAX |
0x4c424e MOV %RAX,-0xb8(%RBP) |
0x4c4255 MOV 0x20(%RBP),%R8 |
0x4c4259 LEA 0x18(%RCX),%RAX |
0x4c425d MOV %RAX,-0xb0(%RBP) |
0x4c4264 MOVQ $0,-0x88(%RBP) |
0x4c426f JMP 4c42d4 |
(3807) 0x4c4271 SAL $0x3,%RDX |
(3807) 0x4c4275 MOV %RDX,-0x58(%RBP) |
(3807) 0x4c4279 MOV %R13,%RSI |
(3807) 0x4c427c MOV %R8,%R14 |
(3807) 0x4c427f MOV %R10,%R12 |
(3807) 0x4c4282 CALL 4dec60 <__intel_avx_rep_memcpy> |
(3807) 0x4c4287 MOV %R12,%RDI |
(3807) 0x4c428a MOV %R14,%RSI |
(3807) 0x4c428d MOV -0x58(%RBP),%RDX |
(3807) 0x4c4291 CALL 4dec60 <__intel_avx_rep_memcpy> |
(3807) 0x4c4296 MOV %R13,%RDI |
(3807) 0x4c4299 VZEROUPPER |
(3807) 0x4c429c CALL 4d5720 <hypre_Free> |
(3807) 0x4c42a1 MOV -0x88(%RBP),%RDI |
(3807) 0x4c42a8 CALL 4d5720 <hypre_Free> |
(3807) 0x4c42ad MOVQ $0,-0x88(%RBP) |
(3807) 0x4c42b8 MOV -0x38(%RBP),%RDX |
(3807) 0x4c42bc MOV -0x68(%RBP),%RSI |
(3807) 0x4c42c0 MOV -0x40(%RBP),%RDI |
(3807) 0x4c42c4 MOV 0x20(%RBP),%R8 |
(3807) 0x4c42c8 INC %RSI |
(3807) 0x4c42cb CMP %RDI,%RSI |
(3807) 0x4c42ce JGE 4c4e03 |
(3807) 0x4c42d4 MOV -0xa8(%RBP),%RAX |
(3807) 0x4c42db MOV (%RAX,%RSI,8),%R10 |
(3807) 0x4c42df MOV (%RDX,%RSI,8),%R9 |
(3807) 0x4c42e3 MOV %R10,-0x58(%RBP) |
(3807) 0x4c42e7 SUB (%R8),%R10 |
(3807) 0x4c42ea MOV %R9,-0x50(%RBP) |
(3807) 0x4c42ee JL 4c43a0 |
(3807) 0x4c42f4 MOV -0x58(%RBP),%RAX |
(3807) 0x4c42f8 CMP 0x8(%R8),%RAX |
(3807) 0x4c42fc JGE 4c43a0 |
(3807) 0x4c4302 CMPQ $0,0x58(%RBP) |
(3807) 0x4c4307 MOV %R10,-0x30(%RBP) |
(3807) 0x4c430b JE 4c45bf |
(3807) 0x4c4311 MOV 0x38(%RBP),%RAX |
(3807) 0x4c4315 MOV (%RAX,%R10,8),%R13 |
(3807) 0x4c4319 MOV 0x40(%RBP),%RAX |
(3807) 0x4c431d MOV (%RAX,%R10,8),%RAX |
(3807) 0x4c4321 MOV %RAX,-0x48(%RBP) |
(3807) 0x4c4325 MOV 0x50(%RBP),%RAX |
(3807) 0x4c4329 MOV (%RAX,%R10,8),%RCX |
(3807) 0x4c432d MOV 0x48(%RBP),%RAX |
(3807) 0x4c4331 MOV (%RAX,%R10,8),%R12 |
(3807) 0x4c4335 MOV %RCX,-0x80(%RBP) |
(3807) 0x4c4339 MOV %RCX,%RAX |
(3807) 0x4c433c SUB %R12,%RAX |
(3807) 0x4c433f MOV %R9,%R14 |
(3807) 0x4c4342 SUB %RAX,%R14 |
(3807) 0x4c4345 MOV %RSI,-0x68(%RBP) |
(3807) 0x4c4349 JLE 4c49c5 |
(3807) 0x4c434f MOV $0x8,%ESI |
(3807) 0x4c4354 MOV %R14,%RDI |
(3807) 0x4c4357 VZEROUPPER |
(3807) 0x4c435a CALL 4d5650 <hypre_CAlloc> |
(3807) 0x4c435f MOV %RAX,-0x70(%RBP) |
(3807) 0x4c4363 MOV $0x8,%ESI |
(3807) 0x4c4368 MOV %R14,%RDI |
(3807) 0x4c436b CALL 4d5650 <hypre_CAlloc> |
(3807) 0x4c4370 MOV -0x30(%RBP),%R10 |
(3807) 0x4c4374 MOV -0x50(%RBP),%R9 |
(3807) 0x4c4378 MOV %RAX,-0x88(%RBP) |
(3807) 0x4c437f TEST %R9,%R9 |
(3807) 0x4c4382 JG 4c49d6 |
(3807) 0x4c4388 MOV 0x48(%RBP),%RAX |
(3807) 0x4c438c MOV %R12,(%RAX,%R10,8) |
(3807) 0x4c4390 JMP 4c4cb6 |
0x4c4395 NOPW %CS:(%RAX,%RAX,1) |
(3807) 0x4c43a0 ADD %R9,-0x60(%RBP) |
(3807) 0x4c43a4 MOV 0x18(%RBP),%RAX |
(3807) 0x4c43a8 CMPQ $0,(%RAX) |
(3807) 0x4c43ac JE 4c42c8 |
(3807) 0x4c43b2 CMPQ $0,0x98(%RBP) |
(3807) 0x4c43ba JLE 4c42c8 |
(3807) 0x4c43c0 MOV %RSI,-0x68(%RBP) |
(3807) 0x4c43c4 CMP %RBX,%R15 |
(3807) 0x4c43c7 SETB %CL |
(3807) 0x4c43ca LEA -0x1(%R9),%RAX |
(3807) 0x4c43ce LEA -0x8(%RBX,%R9,8),%RDX |
(3807) 0x4c43d3 MOV %RDX,-0x80(%RBP) |
(3807) 0x4c43d7 CMP %R15,%RDX |
(3807) 0x4c43da SETB %DL |
(3807) 0x4c43dd OR %CL,%DL |
(3807) 0x4c43df MOV %DL,-0x48(%RBP) |
(3807) 0x4c43e2 XOR %EDI,%EDI |
(3807) 0x4c43e4 XOR %ESI,%ESI |
(3807) 0x4c43e6 JMP 4c4404 |
0x4c43e8 NOPL (%RAX,%RAX,1) |
(3808) 0x4c43f0 LEA 0x1(%RSI),%RCX |
(3808) 0x4c43f4 CMP -0xb8(%RBP),%RSI |
(3808) 0x4c43fb MOV %RCX,%RSI |
(3808) 0x4c43fe JE 4c42b8 |
(3808) 0x4c4404 MOV %RDI,%RDX |
(3808) 0x4c4407 MOV %RSI,%RCX |
(3808) 0x4c440a SAL $0x4,%RCX |
(3808) 0x4c440e MOV 0xa0(%RBP),%R9 |
(3808) 0x4c4415 MOV 0x8(%R9,%RCX,1),%R8 |
(3808) 0x4c441a ADD %R8,%RDI |
(3808) 0x4c441d MOV -0x58(%RBP),%R10 |
(3808) 0x4c4421 CMP %R10,(%R9,%RCX,1) |
(3808) 0x4c4425 JNE 4c43f0 |
(3808) 0x4c4427 CMPQ $0,-0x50(%RBP) |
(3808) 0x4c442c JLE 4c43f0 |
(3808) 0x4c442e MOV 0xa8(%RBP),%R9 |
(3808) 0x4c4435 LEA -0x8(%R9,%RDI,8),%RCX |
(3808) 0x4c443a CMP %R15,%RCX |
(3808) 0x4c443d SETB %R10B |
(3808) 0x4c4441 LEA (%R9,%RDX,8),%R9 |
(3808) 0x4c4445 CMP %R9,%R15 |
(3808) 0x4c4448 SETB %R11B |
(3808) 0x4c444c OR %R10B,%R11B |
(3808) 0x4c444f CMP %RBX,%RCX |
(3808) 0x4c4452 SETB %CL |
(3808) 0x4c4455 CMP %R9,-0x80(%RBP) |
(3808) 0x4c4459 SETB %R10B |
(3808) 0x4c445d OR %CL,%R10B |
(3808) 0x4c4460 AND %R11B,%R10B |
(3808) 0x4c4463 TEST %R10B,-0x48(%RBP) |
(3808) 0x4c4467 JE 4c4570 |
(3808) 0x4c446d MOV %R8,%RCX |
(3808) 0x4c4470 SHR $0x2,%RCX |
(3808) 0x4c4474 MOV %R8,%R11 |
(3808) 0x4c4477 AND $-0x4,%R11 |
(3808) 0x4c447b MOV -0xb0(%RBP),%R10 |
(3808) 0x4c4482 LEA (%R10,%RDX,8),%RDX |
(3808) 0x4c4486 XOR %R13D,%R13D |
(3808) 0x4c4489 JMP 4c44a0 |
0x4c448b NOPL (%RAX,%RAX,1) |
(3811) 0x4c4490 LEA 0x1(%R13),%R10 |
(3811) 0x4c4494 CMP %RAX,%R13 |
(3811) 0x4c4497 MOV %R10,%R13 |
(3811) 0x4c449a JE 4c43f0 |
(3811) 0x4c44a0 TEST %R8,%R8 |
(3811) 0x4c44a3 JLE 4c4490 |
(3811) 0x4c44a5 MOV (%RBX,%R13,8),%R14 |
(3811) 0x4c44a9 CMP $0x4,%R8 |
(3811) 0x4c44ad JAE 4c44e0 |
(3811) 0x4c44af CMP %R8,%R11 |
(3811) 0x4c44b2 JAE 4c4490 |
(3811) 0x4c44b4 MOV %R11,%R10 |
(3811) 0x4c44b7 JMP 4c44c8 |
0x4c44b9 NOPL (%RAX) |
(3812) 0x4c44c0 INC %R10 |
(3812) 0x4c44c3 CMP %R10,%R8 |
(3812) 0x4c44c6 JE 4c4490 |
(3812) 0x4c44c8 CMP %R14,(%R9,%R10,8) |
(3812) 0x4c44cc JNE 4c44c0 |
(3812) 0x4c44ce MOVQ $-0x1,(%R9,%R10,8) |
(3812) 0x4c44d6 INCQ (%R15) |
(3812) 0x4c44d9 JMP 4c44c0 |
0x4c44db NOPL (%RAX,%RAX,1) |
(3811) 0x4c44e0 MOV %RCX,%R10 |
(3811) 0x4c44e3 MOV %RDX,%R12 |
(3811) 0x4c44e6 JMP 4c44f9 |
0x4c44e8 NOPL (%RAX,%RAX,1) |
(3813) 0x4c44f0 ADD $0x20,%R12 |
(3813) 0x4c44f4 DEC %R10 |
(3813) 0x4c44f7 JE 4c44af |
(3813) 0x4c44f9 CMP %R14,-0x18(%R12) |
(3813) 0x4c44fe JE 4c4520 |
(3813) 0x4c4500 CMP %R14,-0x10(%R12) |
(3813) 0x4c4505 JE 4c4533 |
(3813) 0x4c4507 CMP %R14,-0x8(%R12) |
(3813) 0x4c450c JE 4c4546 |
(3813) 0x4c450e CMP %R14,(%R12) |
(3813) 0x4c4512 JNE 4c44f0 |
(3813) 0x4c4514 JMP 4c4558 |
0x4c4516 NOPW %CS:(%RAX,%RAX,1) |
(3813) 0x4c4520 MOVQ $-0x1,-0x18(%R12) |
(3813) 0x4c4529 INCQ (%R15) |
(3813) 0x4c452c CMP %R14,-0x10(%R12) |
(3813) 0x4c4531 JNE 4c4507 |
(3813) 0x4c4533 MOVQ $-0x1,-0x10(%R12) |
(3813) 0x4c453c INCQ (%R15) |
(3813) 0x4c453f CMP %R14,-0x8(%R12) |
(3813) 0x4c4544 JNE 4c450e |
(3813) 0x4c4546 MOVQ $-0x1,-0x8(%R12) |
(3813) 0x4c454f INCQ (%R15) |
(3813) 0x4c4552 CMP %R14,(%R12) |
(3813) 0x4c4556 JNE 4c44f0 |
(3813) 0x4c4558 MOVQ $-0x1,(%R12) |
(3813) 0x4c4560 INCQ (%R15) |
(3813) 0x4c4563 JMP 4c44f0 |
0x4c4565 NOPW %CS:(%RAX,%RAX,1) |
(3808) 0x4c4570 XOR %ECX,%ECX |
(3808) 0x4c4572 JMP 4c4590 |
0x4c4574 NOPW %CS:(%RAX,%RAX,1) |
(3809) 0x4c4580 LEA 0x1(%RCX),%RDX |
(3809) 0x4c4584 CMP %RAX,%RCX |
(3809) 0x4c4587 MOV %RDX,%RCX |
(3809) 0x4c458a JE 4c43f0 |
(3809) 0x4c4590 TEST %R8,%R8 |
(3809) 0x4c4593 JLE 4c4580 |
(3809) 0x4c4595 XOR %EDX,%EDX |
(3809) 0x4c4597 JMP 4c45a8 |
0x4c4599 NOPL (%RAX) |
(3810) 0x4c45a0 INC %RDX |
(3810) 0x4c45a3 CMP %RDX,%R8 |
(3810) 0x4c45a6 JE 4c4580 |
(3810) 0x4c45a8 MOV (%R9,%RDX,8),%R10 |
(3810) 0x4c45ac CMP (%RBX,%RCX,8),%R10 |
(3810) 0x4c45b0 JNE 4c45a0 |
(3810) 0x4c45b2 MOVQ $-0x1,(%R9,%RDX,8) |
(3810) 0x4c45ba INCQ (%R15) |
(3810) 0x4c45bd JMP 4c45a0 |
(3807) 0x4c45bf MOV 0x18(%RBP),%RAX |
(3807) 0x4c45c3 MOV (%RAX),%RAX |
(3807) 0x4c45c6 MOV 0x38(%RAX),%RCX |
(3807) 0x4c45ca MOV 0x40(%RAX),%RAX |
(3807) 0x4c45ce MOV (%RAX,%R10,8),%R14 |
(3807) 0x4c45d2 MOV (%RCX,%R10,8),%R11 |
(3807) 0x4c45d6 TEST %R9,%R9 |
(3807) 0x4c45d9 JLE 4c4cc8 |
(3807) 0x4c45df MOV %RSI,-0x68(%RBP) |
(3807) 0x4c45e3 MOV 0x60(%RBP),%RAX |
(3807) 0x4c45e7 MOV 0x8(%RAX,%R10,8),%RAX |
(3807) 0x4c45ec MOV %RAX,-0x70(%RBP) |
(3807) 0x4c45f0 MOV 0x78(%RBP),%RAX |
(3807) 0x4c45f4 MOV 0x8(%RAX,%R10,8),%RAX |
(3807) 0x4c45f9 MOV %RAX,-0x90(%RBP) |
(3807) 0x4c4600 MOV -0x60(%RBP),%RDX |
(3807) 0x4c4604 LEA (%RDX,%R9,1),%RAX |
(3807) 0x4c4608 MOV %RAX,-0x98(%RBP) |
(3807) 0x4c460f XOR %R8D,%R8D |
(3807) 0x4c4612 MOV %R14,-0x48(%RBP) |
(3807) 0x4c4616 MOV %R11,-0x80(%RBP) |
(3807) 0x4c461a MOV %R11,-0x78(%RBP) |
(3807) 0x4c461e MOV 0x88(%RBP),%RDI |
(3807) 0x4c4625 MOV %R14,%RCX |
(3807) 0x4c4628 JMP 4c464a |
0x4c462a NOPW (%RAX,%RAX,1) |
(3814) 0x4c4630 MOV -0x50(%RBP),%RSI |
(3814) 0x4c4634 MOV -0x30(%RBP),%R10 |
(3814) 0x4c4638 MOV %RCX,%R14 |
(3814) 0x4c463b INC %RDX |
(3814) 0x4c463e INC %R8 |
(3814) 0x4c4641 CMP %RSI,%R8 |
(3814) 0x4c4644 JE 4c4cd0 |
(3814) 0x4c464a MOV (%RBX,%RDX,8),%R9 |
(3814) 0x4c464e CMP 0x28(%RBP),%R9 |
(3814) 0x4c4652 JL 4c47c0 |
(3814) 0x4c4658 CMP 0x30(%RBP),%R9 |
(3814) 0x4c465c JG 4c47c0 |
(3814) 0x4c4662 MOV 0x60(%RBP),%RAX |
(3814) 0x4c4666 MOV (%RAX,%R10,8),%R10 |
(3814) 0x4c466a MOV -0x80(%RBP),%R11 |
(3814) 0x4c466e SUB %R10,%R11 |
(3814) 0x4c4671 JLE 4c4780 |
(3814) 0x4c4677 MOV %RDX,%RAX |
(3814) 0x4c467a MOV 0x68(%RBP),%RDX |
(3814) 0x4c467e LEA (%RDX,%R10,8),%EDX |
(3814) 0x4c4682 AND $0x7f,%EDX |
(3814) 0x4c4685 MOV $0x80,%ESI |
(3814) 0x4c468a SUB %EDX,%ESI |
(3814) 0x4c468c SHR $0x3,%ESI |
(3814) 0x4c468f CMP %RSI,%R11 |
(3814) 0x4c4692 MOV %RSI,%R14 |
(3814) 0x4c4695 CMOVB %R11,%R14 |
(3814) 0x4c4699 TEST %R14,%R14 |
(3814) 0x4c469c JE 4c46c7 |
(3814) 0x4c469e MOV %R10,%R12 |
(3814) 0x4c46a1 MOV %R14,%RDX |
(3814) 0x4c46a4 NOPW %CS:(%RAX,%RAX,1) |
(3820) 0x4c46b0 MOV 0x68(%RBP),%R13 |
(3820) 0x4c46b4 CMP %R9,(%R13,%R12,8) |
(3820) 0x4c46b9 JE 4c4916 |
(3820) 0x4c46bf INC %R12 |
(3820) 0x4c46c2 DEC %RDX |
(3820) 0x4c46c5 JNE 4c46b0 |
(3814) 0x4c46c7 CMP %RSI,%R11 |
(3814) 0x4c46ca MOV %RAX,%RDX |
(3814) 0x4c46cd JBE 4c4780 |
(3814) 0x4c46d3 SUB %R14,%R11 |
(3814) 0x4c46d6 MOV %R11,%R13 |
(3814) 0x4c46d9 AND $-0x10,%R13 |
(3814) 0x4c46dd JE 4c473a |
(3814) 0x4c46df LEA -0x1(%R13),%RDX |
(3814) 0x4c46e3 LEA (%R10,%R14,1),%R12 |
(3814) 0x4c46e7 VPBROADCASTQ %R9,%YMM0 |
(3814) 0x4c46ed MOV 0x68(%RBP),%RSI |
(3814) 0x4c46f1 LEA (%RSI,%R12,8),%RDI |
(3814) 0x4c46f5 XOR %ESI,%ESI |
(3814) 0x4c46f7 NOPW (%RAX,%RAX,1) |
(3819) 0x4c4700 VPCMPEQQ 0x20(%RDI,%RSI,8),%YMM0,%K0 |
(3819) 0x4c4708 VPCMPEQQ (%RDI,%RSI,8),%YMM0,%K1 |
(3819) 0x4c470f VPCMPEQQ 0x60(%RDI,%RSI,8),%YMM0,%K2 |
(3819) 0x4c4717 VPCMPEQQ 0x40(%RDI,%RSI,8),%YMM0,%K3 |
(3819) 0x4c471f KORB %K0,%K1,%K4 |
(3819) 0x4c4723 KORB %K2,%K3,%K5 |
(3819) 0x4c4727 KORTESTB %K5,%K4 |
(3819) 0x4c472b JNE 4c4923 |
(3819) 0x4c4731 ADD $0x10,%RSI |
(3819) 0x4c4735 CMP %RDX,%RSI |
(3819) 0x4c4738 JBE 4c4700 |
(3814) 0x4c473a CMP %R11,%R13 |
(3814) 0x4c473d MOV %RAX,%RDX |
(3814) 0x4c4740 MOV 0x88(%RBP),%RDI |
(3814) 0x4c4747 JAE 4c4780 |
(3814) 0x4c4749 ADD %R14,%R10 |
(3814) 0x4c474c ADD %R13,%R10 |
(3814) 0x4c474f MOV %R10,%R12 |
(3814) 0x4c4752 NOPW %CS:(%RAX,%RAX,1) |
(3818) 0x4c4760 MOV 0x68(%RBP),%RAX |
(3818) 0x4c4764 CMP %R9,(%RAX,%R12,8) |
(3818) 0x4c4768 JE 4c4953 |
(3818) 0x4c476e INC %R12 |
(3818) 0x4c4771 CMP %R12,-0x80(%RBP) |
(3818) 0x4c4775 JNE 4c4760 |
(3814) 0x4c4777 NOPW (%RAX,%RAX,1) |
(3814) 0x4c4780 MOV -0x78(%RBP),%RSI |
(3814) 0x4c4784 CMP -0x70(%RBP),%RSI |
(3814) 0x4c4788 JGE 4c4d22 |
(3814) 0x4c478e MOV 0x68(%RBP),%RAX |
(3814) 0x4c4792 MOV %R9,(%RAX,%RSI,8) |
(3814) 0x4c4796 MOV 0x10(%RBP),%RAX |
(3814) 0x4c479a VMOVQ (%RAX,%RDX,8),%XMM0 |
(3814) 0x4c479f MOV 0x70(%RBP),%RAX |
(3814) 0x4c47a3 VMOVQ %XMM0,(%RAX,%RSI,8) |
(3814) 0x4c47a8 INC %RSI |
(3814) 0x4c47ab MOV %RSI,-0x78(%RBP) |
(3814) 0x4c47af JMP 4c4630 |
0x4c47b4 NOPW %CS:(%RAX,%RAX,1) |
(3814) 0x4c47c0 MOV 0x78(%RBP),%RAX |
(3814) 0x4c47c4 MOV (%RAX,%R10,8),%R10 |
(3814) 0x4c47c8 MOV %R14,%R11 |
(3814) 0x4c47cb SUB %R10,%R11 |
(3814) 0x4c47ce JLE 4c48e0 |
(3814) 0x4c47d4 MOV %RDX,%RAX |
(3814) 0x4c47d7 MOV 0x80(%RBP),%RDX |
(3814) 0x4c47de LEA (%RDX,%R10,8),%EDX |
(3814) 0x4c47e2 AND $0x7f,%EDX |
(3814) 0x4c47e5 MOV $0x80,%ESI |
(3814) 0x4c47ea SUB %EDX,%ESI |
(3814) 0x4c47ec SHR $0x3,%ESI |
(3814) 0x4c47ef CMP %RSI,%R11 |
(3814) 0x4c47f2 MOV %RSI,%R14 |
(3814) 0x4c47f5 CMOVB %R11,%R14 |
(3814) 0x4c47f9 TEST %R14,%R14 |
(3814) 0x4c47fc JE 4c482a |
(3814) 0x4c47fe MOV %R10,%R12 |
(3814) 0x4c4801 MOV %R14,%RDX |
(3814) 0x4c4804 NOPW %CS:(%RAX,%RAX,1) |
(3817) 0x4c4810 MOV 0x80(%RBP),%R13 |
(3817) 0x4c4817 CMP %R9,(%R13,%R12,8) |
(3817) 0x4c481c JE 4c491b |
(3817) 0x4c4822 INC %R12 |
(3817) 0x4c4825 DEC %RDX |
(3817) 0x4c4828 JNE 4c4810 |
(3814) 0x4c482a CMP %RSI,%R11 |
(3814) 0x4c482d MOV %RAX,%RDX |
(3814) 0x4c4830 JBE 4c48e0 |
(3814) 0x4c4836 SUB %R14,%R11 |
(3814) 0x4c4839 MOV %R11,%R13 |
(3814) 0x4c483c AND $-0x10,%R13 |
(3814) 0x4c4840 JE 4c489a |
(3814) 0x4c4842 LEA -0x1(%R13),%RDX |
(3814) 0x4c4846 LEA (%R10,%R14,1),%R12 |
(3814) 0x4c484a VPBROADCASTQ %R9,%YMM0 |
(3814) 0x4c4850 MOV 0x80(%RBP),%RSI |
(3814) 0x4c4857 LEA (%RSI,%R12,8),%RDI |
(3814) 0x4c485b XOR %ESI,%ESI |
(3814) 0x4c485d NOPL (%RAX) |
(3816) 0x4c4860 VPCMPEQQ 0x20(%RDI,%RSI,8),%YMM0,%K0 |
(3816) 0x4c4868 VPCMPEQQ (%RDI,%RSI,8),%YMM0,%K1 |
(3816) 0x4c486f VPCMPEQQ 0x60(%RDI,%RSI,8),%YMM0,%K2 |
(3816) 0x4c4877 VPCMPEQQ 0x40(%RDI,%RSI,8),%YMM0,%K3 |
(3816) 0x4c487f KORB %K0,%K1,%K4 |
(3816) 0x4c4883 KORB %K2,%K3,%K5 |
(3816) 0x4c4887 KORTESTB %K5,%K4 |
(3816) 0x4c488b JNE 4c4976 |
(3816) 0x4c4891 ADD $0x10,%RSI |
(3816) 0x4c4895 CMP %RDX,%RSI |
(3816) 0x4c4898 JBE 4c4860 |
(3814) 0x4c489a CMP %R11,%R13 |
(3814) 0x4c489d MOV %RAX,%RDX |
(3814) 0x4c48a0 MOV 0x88(%RBP),%RDI |
(3814) 0x4c48a7 JAE 4c48e0 |
(3814) 0x4c48a9 ADD %R14,%R10 |
(3814) 0x4c48ac ADD %R13,%R10 |
(3814) 0x4c48af MOV %R10,%R12 |
(3814) 0x4c48b2 NOPW %CS:(%RAX,%RAX,1) |
(3815) 0x4c48c0 MOV 0x80(%RBP),%RAX |
(3815) 0x4c48c7 CMP %R9,(%RAX,%R12,8) |
(3815) 0x4c48cb JE 4c49a6 |
(3815) 0x4c48d1 INC %R12 |
(3815) 0x4c48d4 CMP %R12,%RCX |
(3815) 0x4c48d7 JNE 4c48c0 |
(3814) 0x4c48d9 NOPL (%RAX) |
(3814) 0x4c48e0 MOV -0x48(%RBP),%RSI |
(3814) 0x4c48e4 CMP -0x90(%RBP),%RSI |
(3814) 0x4c48eb JGE 4c4d5f |
(3814) 0x4c48f1 MOV 0x80(%RBP),%RAX |
(3814) 0x4c48f8 MOV %R9,(%RAX,%RSI,8) |
(3814) 0x4c48fc MOV 0x10(%RBP),%RAX |
(3814) 0x4c4900 VMOVQ (%RAX,%RDX,8),%XMM0 |
(3814) 0x4c4905 VMOVQ %XMM0,(%RDI,%RSI,8) |
(3814) 0x4c490a INC %RSI |
(3814) 0x4c490d MOV %RSI,-0x48(%RBP) |
(3814) 0x4c4911 JMP 4c4630 |
(3814) 0x4c4916 MOV %RAX,%RDX |
(3814) 0x4c4919 JMP 4c4953 |
(3814) 0x4c491b MOV %RAX,%RDX |
(3814) 0x4c491e JMP 4c49a6 |
(3814) 0x4c4923 KSHIFTLB $0x4,%K0,%K0 |
(3814) 0x4c4929 KORB %K0,%K1,%K0 |
(3814) 0x4c492d KSHIFTLB $0x4,%K2,%K1 |
(3814) 0x4c4933 KORB %K1,%K3,%K1 |
(3814) 0x4c4937 KUNPCKBW %K0,%K1,%K0 |
(3814) 0x4c493b KMOVD %K0,%EDX |
(3814) 0x4c493f TZCNT %EDX,%EDX |
(3814) 0x4c4943 ADD %RSI,%R12 |
(3814) 0x4c4946 ADD %RDX,%R12 |
(3814) 0x4c4949 MOV %RAX,%RDX |
(3814) 0x4c494c MOV 0x88(%RBP),%RDI |
(3814) 0x4c4953 MOV -0x50(%RBP),%RSI |
(3814) 0x4c4957 MOV -0x30(%RBP),%R10 |
(3814) 0x4c495b MOV %RCX,%R14 |
(3814) 0x4c495e MOV 0x10(%RBP),%RAX |
(3814) 0x4c4962 VMOVQ (%RAX,%RDX,8),%XMM0 |
(3814) 0x4c4967 MOV 0x70(%RBP),%RAX |
(3814) 0x4c496b VMOVQ %XMM0,(%RAX,%R12,8) |
(3814) 0x4c4971 JMP 4c463b |
(3814) 0x4c4976 KSHIFTLB $0x4,%K0,%K0 |
(3814) 0x4c497c KORB %K0,%K1,%K0 |
(3814) 0x4c4980 KSHIFTLB $0x4,%K2,%K1 |
(3814) 0x4c4986 KORB %K1,%K3,%K1 |
(3814) 0x4c498a KUNPCKBW %K0,%K1,%K0 |
(3814) 0x4c498e KMOVD %K0,%EDX |
(3814) 0x4c4992 TZCNT %EDX,%EDX |
(3814) 0x4c4996 ADD %RSI,%R12 |
(3814) 0x4c4999 ADD %RDX,%R12 |
(3814) 0x4c499c MOV %RAX,%RDX |
(3814) 0x4c499f MOV 0x88(%RBP),%RDI |
(3814) 0x4c49a6 MOV -0x50(%RBP),%RSI |
(3814) 0x4c49aa MOV -0x30(%RBP),%R10 |
(3814) 0x4c49ae MOV %RCX,%R14 |
(3814) 0x4c49b1 MOV 0x10(%RBP),%RAX |
(3814) 0x4c49b5 VMOVQ (%RAX,%RDX,8),%XMM0 |
(3814) 0x4c49ba VMOVQ %XMM0,(%RDI,%R12,8) |
(3814) 0x4c49c0 JMP 4c463b |
(3807) 0x4c49c5 MOVQ $0,-0x70(%RBP) |
(3807) 0x4c49cd TEST %R9,%R9 |
(3807) 0x4c49d0 JLE 4c4388 |
(3807) 0x4c49d6 LEA -0x1(%R9),%RAX |
(3807) 0x4c49da MOV %R13D,%EDX |
(3807) 0x4c49dd AND $0x7f,%EDX |
(3807) 0x4c49e0 MOV $0x80,%ECX |
(3807) 0x4c49e5 SUB %EDX,%ECX |
(3807) 0x4c49e7 SHR $0x3,%ECX |
(3807) 0x4c49ea CMP %RCX,%R12 |
(3807) 0x4c49ed MOV %RCX,-0x78(%RBP) |
(3807) 0x4c49f1 MOV %RCX,%RDX |
(3807) 0x4c49f4 CMOVB %R12,%RDX |
(3807) 0x4c49f8 MOV %R12,%RCX |
(3807) 0x4c49fb SUB %RDX,%RCX |
(3807) 0x4c49fe MOV %RCX,-0x98(%RBP) |
(3807) 0x4c4a05 AND $-0x10,%RCX |
(3807) 0x4c4a09 LEA -0x1(%RCX),%R8 |
(3807) 0x4c4a0d LEA (%R13,%RDX,8),%R9 |
(3807) 0x4c4a12 MOV %RCX,-0x90(%RBP) |
(3807) 0x4c4a19 ADD %RDX,%RCX |
(3807) 0x4c4a1c MOV %RCX,-0xa0(%RBP) |
(3807) 0x4c4a23 MOVQ $0,-0x58(%RBP) |
(3807) 0x4c4a2b MOV %R12,%R14 |
(3807) 0x4c4a2e XOR %R11D,%R11D |
(3807) 0x4c4a31 JMP 4c4a7c |
0x4c4a33 NOPW %CS:(%RAX,%RAX,1) |
(3824) 0x4c4a40 MOV -0x70(%RBP),%RDI |
(3824) 0x4c4a44 MOV -0x58(%RBP),%RCX |
(3824) 0x4c4a48 MOV %RSI,(%RDI,%RCX,8) |
(3824) 0x4c4a4c MOV -0x88(%RBP),%RSI |
(3824) 0x4c4a53 LEA (%RSI,%RCX,8),%RSI |
(3824) 0x4c4a57 INC %RCX |
(3824) 0x4c4a5a MOV %RCX,-0x58(%RBP) |
(3824) 0x4c4a5e MOV 0x10(%RBP),%RDI |
(3824) 0x4c4a62 VMOVQ (%RDI,%R10,8),%XMM0 |
(3824) 0x4c4a68 VMOVQ %XMM0,(%RSI) |
(3824) 0x4c4a6c LEA 0x1(%R11),%RSI |
(3824) 0x4c4a70 CMP %RAX,%R11 |
(3824) 0x4c4a73 MOV %RSI,%R11 |
(3824) 0x4c4a76 JE 4c4b8e |
(3824) 0x4c4a7c TEST %R12,%R12 |
(3824) 0x4c4a7f JLE 4c4b30 |
(3824) 0x4c4a85 MOV -0x60(%RBP),%RSI |
(3824) 0x4c4a89 LEA (%RSI,%R11,1),%R10 |
(3824) 0x4c4a8d MOV (%RBX,%R10,8),%RDI |
(3824) 0x4c4a91 TEST %RDX,%RDX |
(3824) 0x4c4a94 JE 4c4ab3 |
(3824) 0x4c4a96 XOR %ESI,%ESI |
(3824) 0x4c4a98 NOPL (%RAX,%RAX,1) |
(3827) 0x4c4aa0 CMP %RDI,(%R13,%RSI,8) |
(3827) 0x4c4aa5 JE 4c4b81 |
(3827) 0x4c4aab INC %RSI |
(3827) 0x4c4aae CMP %RSI,%RDX |
(3827) 0x4c4ab1 JNE 4c4aa0 |
(3824) 0x4c4ab3 CMP -0x78(%RBP),%R12 |
(3824) 0x4c4ab7 JBE 4c4b30 |
(3824) 0x4c4ab9 CMPQ $0,-0x90(%RBP) |
(3824) 0x4c4ac1 JE 4c4b06 |
(3824) 0x4c4ac3 VPBROADCASTQ %RDI,%YMM0 |
(3824) 0x4c4ac9 XOR %ESI,%ESI |
(3824) 0x4c4acb NOPL (%RAX,%RAX,1) |
(3826) 0x4c4ad0 VPCMPEQQ 0x20(%R9,%RSI,8),%YMM0,%K0 |
(3826) 0x4c4ad8 VPCMPEQQ (%R9,%RSI,8),%YMM0,%K1 |
(3826) 0x4c4adf VPCMPEQQ 0x60(%R9,%RSI,8),%YMM0,%K2 |
(3826) 0x4c4ae7 VPCMPEQQ 0x40(%R9,%RSI,8),%YMM0,%K3 |
(3826) 0x4c4aef KORB %K0,%K1,%K4 |
(3826) 0x4c4af3 KORB %K2,%K3,%K5 |
(3826) 0x4c4af7 KORTESTB %K5,%K4 |
(3826) 0x4c4afb JNE 4c4b5b |
(3826) 0x4c4afd ADD $0x10,%RSI |
(3826) 0x4c4b01 CMP %R8,%RSI |
(3826) 0x4c4b04 JBE 4c4ad0 |
(3824) 0x4c4b06 MOV -0x90(%RBP),%RCX |
(3824) 0x4c4b0d CMP -0x98(%RBP),%RCX |
(3824) 0x4c4b14 JAE 4c4b30 |
(3824) 0x4c4b16 MOV -0xa0(%RBP),%RSI |
(3824) 0x4c4b1d NOPL (%RAX) |
(3825) 0x4c4b20 CMP %RDI,(%R13,%RSI,8) |
(3825) 0x4c4b25 JE 4c4b81 |
(3825) 0x4c4b27 INC %RSI |
(3825) 0x4c4b2a CMP %RSI,%R12 |
(3825) 0x4c4b2d JNE 4c4b20 |
(3824) 0x4c4b2f NOP |
(3824) 0x4c4b30 MOV -0x60(%RBP),%RSI |
(3824) 0x4c4b34 LEA (%RSI,%R11,1),%R10 |
(3824) 0x4c4b38 MOV (%RBX,%R10,8),%RSI |
(3824) 0x4c4b3c CMP -0x80(%RBP),%R14 |
(3824) 0x4c4b40 JGE 4c4a40 |
(3824) 0x4c4b46 MOV %RSI,(%R13,%R14,8) |
(3824) 0x4c4b4b MOV -0x48(%RBP),%RCX |
(3824) 0x4c4b4f LEA (%RCX,%R14,8),%RSI |
(3824) 0x4c4b53 INC %R14 |
(3824) 0x4c4b56 JMP 4c4a5e |
(3824) 0x4c4b5b KSHIFTLB $0x4,%K0,%K0 |
(3824) 0x4c4b61 KORB %K0,%K1,%K0 |
(3824) 0x4c4b65 KSHIFTLB $0x4,%K2,%K1 |
(3824) 0x4c4b6b KORB %K1,%K3,%K1 |
(3824) 0x4c4b6f KUNPCKBW %K0,%K1,%K0 |
(3824) 0x4c4b73 KMOVD %K0,%EDI |
(3824) 0x4c4b77 TZCNT %EDI,%EDI |
(3824) 0x4c4b7b ADD %RDX,%RSI |
(3824) 0x4c4b7e ADD %RDI,%RSI |
(3824) 0x4c4b81 MOV -0x48(%RBP),%RCX |
(3824) 0x4c4b85 LEA (%RCX,%RSI,8),%RSI |
(3824) 0x4c4b89 JMP 4c4a5e |
(3807) 0x4c4b8e MOV -0x60(%RBP),%RAX |
(3807) 0x4c4b92 ADD -0x50(%RBP),%RAX |
(3807) 0x4c4b96 MOV -0x58(%RBP),%RSI |
(3807) 0x4c4b9a LEA (%R14,%RSI,1),%R12 |
(3807) 0x4c4b9e MOV 0x48(%RBP),%RCX |
(3807) 0x4c4ba2 MOV -0x30(%RBP),%RDX |
(3807) 0x4c4ba6 MOV %R12,(%RCX,%RDX,8) |
(3807) 0x4c4baa TEST %RSI,%RSI |
(3807) 0x4c4bad MOV %RAX,-0x60(%RBP) |
(3807) 0x4c4bb1 JE 4c4cb6 |
(3807) 0x4c4bb7 MOV 0x38(%RBP),%RAX |
(3807) 0x4c4bbb MOV (%RAX,%RDX,8),%RDI |
(3807) 0x4c4bbf LEA (,%R12,8),%R13 |
(3807) 0x4c4bc7 MOV %R13,%RSI |
(3807) 0x4c4bca VZEROUPPER |
(3807) 0x4c4bcd CALL 4d56b0 <hypre_ReAlloc> |
(3807) 0x4c4bd2 MOV -0x30(%RBP),%RCX |
(3807) 0x4c4bd6 MOV 0x38(%RBP),%RDX |
(3807) 0x4c4bda MOV %RAX,(%RDX,%RCX,8) |
(3807) 0x4c4bde MOV 0x40(%RBP),%RCX |
(3807) 0x4c4be2 MOV -0x30(%RBP),%RAX |
(3807) 0x4c4be6 MOV (%RCX,%RAX,8),%RDI |
(3807) 0x4c4bea MOV %R13,%RSI |
(3807) 0x4c4bed CALL 4d56b0 <hypre_ReAlloc> |
(3807) 0x4c4bf2 MOV -0x58(%RBP),%RDX |
(3807) 0x4c4bf6 MOV -0x30(%RBP),%RSI |
(3807) 0x4c4bfa MOV 0x40(%RBP),%RCX |
(3807) 0x4c4bfe MOV %RAX,(%RCX,%RSI,8) |
(3807) 0x4c4c02 MOV 0x50(%RBP),%RCX |
(3807) 0x4c4c06 MOV %R12,(%RCX,%RSI,8) |
(3807) 0x4c4c0a TEST %RDX,%RDX |
(3807) 0x4c4c0d JLE 4c4cb6 |
(3807) 0x4c4c13 MOV 0x38(%RBP),%RCX |
(3807) 0x4c4c17 MOV (%RCX,%RSI,8),%RCX |
(3807) 0x4c4c1b MOV -0x70(%RBP),%R13 |
(3807) 0x4c4c1f LEA -0x8(%R13,%RDX,8),%RSI |
(3807) 0x4c4c24 LEA (%RCX,%R14,8),%RDI |
(3807) 0x4c4c28 CMP %RDI,%RSI |
(3807) 0x4c4c2b SETAE %R9B |
(3807) 0x4c4c2f LEA -0x8(%RCX,%R12,8),%RCX |
(3807) 0x4c4c34 CMP %R13,%RCX |
(3807) 0x4c4c37 SETAE %SIL |
(3807) 0x4c4c3b MOV -0x88(%RBP),%R8 |
(3807) 0x4c4c42 LEA -0x8(%R8,%RDX,8),%RCX |
(3807) 0x4c4c47 LEA (%RAX,%R14,8),%R10 |
(3807) 0x4c4c4b CMP %R10,%RCX |
(3807) 0x4c4c4e SETB %CL |
(3807) 0x4c4c51 LEA -0x8(%RAX,%R12,8),%RAX |
(3807) 0x4c4c56 CMP %R8,%RAX |
(3807) 0x4c4c59 SETB %AL |
(3807) 0x4c4c5c TEST %SIL,%R9B |
(3807) 0x4c4c5f JNE 4c4cf0 |
(3807) 0x4c4c65 OR %AL,%CL |
(3807) 0x4c4c67 JE 4c4cf0 |
(3807) 0x4c4c6d CMP $0xd,%RDX |
(3807) 0x4c4c71 JAE 4c4271 |
(3807) 0x4c4c77 MOV %RDX,%RAX |
(3807) 0x4c4c7a AND $-0x4,%RAX |
(3807) 0x4c4c7e JE 4c4ddc |
(3807) 0x4c4c84 LEA -0x1(%RAX),%RCX |
(3807) 0x4c4c88 XOR %ESI,%ESI |
(3807) 0x4c4c8a NOPW (%RAX,%RAX,1) |
(3823) 0x4c4c90 VMOVUPS (%R13,%RSI,8),%YMM0 |
(3823) 0x4c4c97 VMOVUPS %YMM0,(%RDI,%RSI,8) |
(3823) 0x4c4c9c VMOVDQU (%R8,%RSI,8),%YMM0 |
(3823) 0x4c4ca2 VMOVDQU %YMM0,(%R10,%RSI,8) |
(3823) 0x4c4ca8 ADD $0x4,%RSI |
(3823) 0x4c4cac CMP %RCX,%RSI |
(3823) 0x4c4caf JLE 4c4c90 |
(3807) 0x4c4cb1 JMP 4c4de0 |
(3807) 0x4c4cb6 MOV -0x70(%RBP),%R13 |
(3807) 0x4c4cba TEST %R13,%R13 |
(3807) 0x4c4cbd JNE 4c4296 |
(3807) 0x4c4cc3 JMP 4c42b8 |
(3807) 0x4c4cc8 MOV %R14,%R9 |
(3807) 0x4c4ccb JMP 4c4dc0 |
(3807) 0x4c4cd0 MOV -0x98(%RBP),%RAX |
(3807) 0x4c4cd7 MOV %RAX,-0x60(%RBP) |
(3807) 0x4c4cdb MOV -0x38(%RBP),%RDX |
(3807) 0x4c4cdf MOV -0x68(%RBP),%RSI |
(3807) 0x4c4ce3 MOV -0x40(%RBP),%RDI |
(3807) 0x4c4ce7 MOV 0x20(%RBP),%R8 |
(3807) 0x4c4ceb JMP 4c4db8 |
(3807) 0x4c4cf0 XOR %EAX,%EAX |
(3807) 0x4c4cf2 NOPW %CS:(%RAX,%RAX,1) |
(3821) 0x4c4d00 MOV (%R13,%RAX,8),%RCX |
(3821) 0x4c4d05 MOV %RCX,(%RDI,%RAX,8) |
(3821) 0x4c4d09 VMOVQ (%R8,%RAX,8),%XMM0 |
(3821) 0x4c4d0f VMOVQ %XMM0,(%R10,%RAX,8) |
(3821) 0x4c4d15 INC %RAX |
(3821) 0x4c4d18 CMP %RAX,%RDX |
(3821) 0x4c4d1b JNE 4c4d00 |
(3807) 0x4c4d1d JMP 4c4296 |
(3807) 0x4c4d22 MOV %RDX,-0x60(%RBP) |
(3807) 0x4c4d26 MOV -0x58(%RBP),%R14 |
(3807) 0x4c4d2a MOV $0x4f4b43,%EDI |
(3807) 0x4c4d2f MOV $0xd70,%ESI |
(3807) 0x4c4d34 MOV $0x1,%EDX |
(3807) 0x4c4d39 XOR %ECX,%ECX |
(3807) 0x4c4d3b VZEROUPPER |
(3807) 0x4c4d3e CALL 4d8210 <hypre_error_handler> |
(3807) 0x4c4d43 MOV 0xd0(%RBP),%RAX |
(3807) 0x4c4d4a LOCK INCQ (%RAX) |
(3807) 0x4c4d4e MOV $0x4f4cc5,%EDI |
(3807) 0x4c4d53 CMPQ $0,0xc0(%RBP) |
(3807) 0x4c4d5b JNE 4c4d9a |
(3807) 0x4c4d5d JMP 4c4da4 |
(3807) 0x4c4d5f MOV %RDX,-0x60(%RBP) |
(3807) 0x4c4d63 MOV -0x58(%RBP),%R14 |
(3807) 0x4c4d67 MOV $0x4f4b43,%EDI |
(3807) 0x4c4d6c MOV $0xd4e,%ESI |
(3807) 0x4c4d71 MOV $0x1,%EDX |
(3807) 0x4c4d76 XOR %ECX,%ECX |
(3807) 0x4c4d78 VZEROUPPER |
(3807) 0x4c4d7b CALL 4d8210 <hypre_error_handler> |
(3807) 0x4c4d80 MOV 0xd0(%RBP),%RAX |
(3807) 0x4c4d87 LOCK INCQ (%RAX) |
(3807) 0x4c4d8b MOV $0x4f4c9f,%EDI |
(3807) 0x4c4d90 CMPQ $0,0xc0(%RBP) |
(3807) 0x4c4d98 JE 4c4da4 |
(3807) 0x4c4d9a MOV %R14,%RSI |
(3807) 0x4c4d9d XOR %EAX,%EAX |
(3807) 0x4c4d9f CALL 4d5800 <hypre_printf> |
(3807) 0x4c4da4 MOV -0x38(%RBP),%RDX |
(3807) 0x4c4da8 MOV -0x68(%RBP),%RSI |
(3807) 0x4c4dac MOV -0x40(%RBP),%RDI |
(3807) 0x4c4db0 MOV 0x20(%RBP),%R8 |
(3807) 0x4c4db4 MOV -0x30(%RBP),%R10 |
(3807) 0x4c4db8 MOV -0x48(%RBP),%R9 |
(3807) 0x4c4dbc MOV -0x78(%RBP),%R11 |
(3807) 0x4c4dc0 MOV 0x18(%RBP),%RAX |
(3807) 0x4c4dc4 MOV (%RAX),%RAX |
(3807) 0x4c4dc7 MOV 0x38(%RAX),%RCX |
(3807) 0x4c4dcb MOV %R11,(%RCX,%R10,8) |
(3807) 0x4c4dcf MOV 0x40(%RAX),%RAX |
(3807) 0x4c4dd3 MOV %R9,(%RAX,%R10,8) |
(3807) 0x4c4dd7 JMP 4c42c8 |
(3807) 0x4c4ddc XOR %EAX,%EAX |
(3807) 0x4c4dde JMP 4c4de9 |
(3822) 0x4c4de0 CMP %RAX,%RDX |
(3822) 0x4c4de3 JE 4c4296 |
(3822) 0x4c4de9 MOV (%R13,%RAX,8),%RCX |
(3822) 0x4c4dee MOV %RCX,(%RDI,%RAX,8) |
(3822) 0x4c4df2 VMOVQ (%R8,%RAX,8),%XMM0 |
(3822) 0x4c4df8 VMOVQ %XMM0,(%R10,%RAX,8) |
(3822) 0x4c4dfe INC %RAX |
(3822) 0x4c4e01 JMP 4c4de0 |
0x4c4e03 ADD $0x98,%RSP |
0x4c4e0a POP %RBX |
0x4c4e0b POP %R12 |
0x4c4e0d POP %R13 |
0x4c4e0f POP %R14 |
0x4c4e11 POP %R15 |
0x4c4e13 POP %RBP |
0x4c4e14 VZEROUPPER |
0x4c4e17 RET |
0x4c4e18 NOPL (%RAX,%RAX,1) |
Path / |
Source file and lines | IJMatrix_parcsr.c:3240-3484 |
Module | exec |
nb instructions | 165 |
nb uops | 178 |
loop length | 684 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 13 |
micro-operation queue | 29.67 cycles |
front end | 29.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 12.00 | 12.00 | 9.33 | 9.33 | 10.00 | 12.00 | 12.00 | 10.00 | 10.00 | 10.00 | 12.00 | 9.33 |
cycles | 12.00 | 16.80 | 9.33 | 9.33 | 10.00 | 12.00 | 12.00 | 10.00 | 10.00 | 10.00 | 12.00 | 9.33 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 28.34-28.39 |
Stall cycles | 0.00 |
Front-end | 29.67 |
Dispatch | 16.80 |
DIV/SQRT | 16.00 |
Overall L1 | 29.67 |
all | 17% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 21% |
all | 13% |
load | 12% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 14% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d7300 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d7310 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4c401e <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x4e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R13 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 4c4026 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x56> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R15D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R13D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xb8(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%R14),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c404e <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x7e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x1(%RAX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
IMUL %RCX,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP 4c4062 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x92> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVQ $0,(%R15,%R14,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c413f <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x16f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R15,%R14,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x8(%RSI,%R8,8),%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %R14,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%RDX,%RAX,1),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RSI,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c40c1 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xf1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RDI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c40c1 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xf1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4c413f <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x16f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RSI,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4c4116 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x146> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RSI),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%RDI | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RSI,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4c4122 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x152> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4c413c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x16c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R13),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719570,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 40fed0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4c41f4 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x224> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c41f4 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x224> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x8,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c41c7 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x1f7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x3,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R15),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x40(%R15),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x8,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4c41f4 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x224> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R15,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R13),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719590,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fed0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4c4212 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x242> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x8(%R15,%R14,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c421a <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x24a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOVQ $0,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c4e03 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xe33> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x98(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RAX,%R14,8),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x1(%R8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SHR $0x1,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x18(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c42d4 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x304> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | IJMatrix_parcsr.c:3240-3484 |
Module | exec |
nb instructions | 165 |
nb uops | 178 |
loop length | 684 |
used x86 registers | 15 |
used mmx registers | 0 |
used xmm registers | 2 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 13 |
micro-operation queue | 29.67 cycles |
front end | 29.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 12.00 | 12.00 | 9.33 | 9.33 | 10.00 | 12.00 | 12.00 | 10.00 | 10.00 | 10.00 | 12.00 | 9.33 |
cycles | 12.00 | 16.80 | 9.33 | 9.33 | 10.00 | 12.00 | 12.00 | 10.00 | 10.00 | 10.00 | 12.00 | 9.33 |
Cycles executing div or sqrt instructions | 16.00 |
FE+BE cycles | 28.34-28.39 |
Stall cycles | 0.00 |
Front-end | 29.67 |
Dispatch | 16.80 |
DIV/SQRT | 16.00 |
Overall L1 | 29.67 |
all | 17% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 100% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 21% |
all | 13% |
load | 12% |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 25% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 9% |
other | 14% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R8,-0xa8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDX,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d7300 <hypre_NumActiveThreads> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 4d7310 <hypre_GetThreadNum> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %RAX,%R14 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
OR %R15,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x20,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
JE 4c401e <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x4e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R15,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CQTO | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R13 | 5 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 10 |
JMP 4c4026 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x56> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %R15D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
DIV %R13D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0xb8(%RBP),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%R14),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RDX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c404e <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x7e> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA 0x1(%RAX),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
IMUL %RCX,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
JMP 4c4062 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x92> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
IMUL %R14,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVQ $0,(%R15,%R14,8) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CMP %R8,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 4c413f <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x16f> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA (%R15,%R14,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA -0x8(%RSI,%R8,8),%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
CMP %RDX,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVL %R14,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IMUL %R14,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (%RDX,%RAX,1),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RDI,%RSI,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CMP %RCX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c40c1 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xf1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP %RDI,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c40c1 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xf1> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
XOR %EAX,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R12,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x38(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JMP 4c413f <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x16f> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOV -0x40(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %RSI,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x4,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
JE 4c4116 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x146> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
LEA -0x1(%RSI),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPXOR %XMM0,%XMM0,%XMM0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R10D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VEXTRACTI128 $0x1,%YMM0,%XMM1 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VPSHUFD $-0x12,%XMM0,%XMM1 | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
VPADDQ %XMM1,%XMM0,%XMM0 | 1 | 0.33 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
VMOVQ %XMM0,%RDI | 1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
CMP %RSI,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
JNE 4c4122 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x152> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
JMP 4c413c <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x16c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV -0x38(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV -0x40(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,(%RCX) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%R13),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719570,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 40fed0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JNE 4c41f4 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x224> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xc8(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 4c41f4 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x224> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
CMP $0x8,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JB 4c41c7 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x1f7> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SHR $0x3,%RCX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV (%R15),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x40(%R15),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x8,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP %RAX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JAE 4c41f4 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x224> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV (%R15,%RCX,8),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV (%R13),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x719590,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 40fed0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
TEST %R14,%R14 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JE 4c4212 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x242> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x8(%R15,%R14,8),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c421a <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x24a> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
MOVQ $0,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV -0x38(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV -0x40(%RBP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RDI,%R12 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 4c4e03 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0xe33> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV 0xb0(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x98(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RAX,%R14,8),%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA -0x1(%R8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SHR $0x1,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RAX,-0xb8(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x18(%RCX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,-0xb0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVQ $0,-0x88(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 4c42d4 <hypre_IJMatrixSetValuesOMPParCSR.extracted.28+0x304> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x98,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_IJMatrixSetValuesOMPParCSR.extracted.28– | 0.81 | 0.13 |
▼Loop 3807 - IJMatrix_parcsr.c:3262-3484 - exec– | 0.09 | 0.01 |
▼Loop 3814 - IJMatrix_parcsr.c:3262-3454 - exec– | 0.71 | 0.1 |
○Loop 3820 - IJMatrix_parcsr.c:3422-3424 - exec | 0 | 0 |
○Loop 3818 - IJMatrix_parcsr.c:3422-3424 - exec | 0 | 0 |
○Loop 3816 - IJMatrix_parcsr.c:3388-3424 - exec | 0 | 0 |
○Loop 3819 - IJMatrix_parcsr.c:3422-3424 - exec | 0 | 0 |
○Loop 3817 - IJMatrix_parcsr.c:3388-3390 - exec | 0 | 0 |
○Loop 3815 - IJMatrix_parcsr.c:3388-3390 - exec | 0 | 0 |
▼Loop 3808 - IJMatrix_parcsr.c:3262-3484 - exec– | 0 | 0 |
▼Loop 3809 - IJMatrix_parcsr.c:3475-3484 - exec– | 0 | 0 |
○Loop 3810 - IJMatrix_parcsr.c:3478-3484 - exec | 0 | 0 |
▼Loop 3811 - IJMatrix_parcsr.c:3475-3484 - exec– | 0 | 0 |
○Loop 3812 - IJMatrix_parcsr.c:3478-3484 - exec | 0 | 0 |
○Loop 3813 - IJMatrix_parcsr.c:3478-3484 - exec | 0 | 0 |
○Loop 3822 - IJMatrix_parcsr.c:3359-3458 - exec | 0 | 0 |
○Loop 3821 - IJMatrix_parcsr.c:3359-3362 - exec | 0 | 0 |
○Loop 3823 - IJMatrix_parcsr.c:3359-3362 - exec | 0 | 0 |
▼Loop 3824 - IJMatrix_parcsr.c:3262-3337 - exec– | 0 | 0 |
○Loop 3825 - IJMatrix_parcsr.c:3318-3320 - exec | 0 | 0 |
○Loop 3826 - IJMatrix_parcsr.c:3318-3320 - exec | 0 | 0 |
○Loop 3827 - IJMatrix_parcsr.c:3318-3320 - exec | 0 | 0 |
○Loop 3828 - IJMatrix_parcsr.c:3282-3283 - exec | 0 | 0 |
○Loop 3831 - IJMatrix_parcsr.c:3274-3275 - exec | 0 | 0 |
○Loop 3829 - IJMatrix_parcsr.c:3282-3283 - exec | 0 | 0 |
○Loop 3832 - IJMatrix_parcsr.c:3274-3275 - exec | 0 | 0 |
○Loop 3830 - IJMatrix_parcsr.c:3274-3275 - exec | 0 | 0 |