NuSiF-Solver/PoissonSolver/2D-mpi/ICC/solver.s

4207 lines
262 KiB
ArmAsm
Raw Normal View History

2024-01-08 22:32:30 +01:00
# mark_description "Intel(R) C Intel(R) 64 Compiler Classic for applications running on Intel(R) 64, Version 2021.10.0 Build 202";
# mark_description "30609_000000";
# mark_description "-I./src/includes -I./ICC -I/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-mpi-2021.1";
# mark_description "0.0-ki6gcj4pr5rekayazvm4lsmvcyosce25/mpi/2021.10.0/include -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux";
# mark_description "8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux";
# mark_description "/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-ax";
# mark_description "ze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/x64 -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almal";
# mark_description "inux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/l";
# mark_description "inux/lib/oclfpga/host/linux64/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel";
# mark_description "-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/oclfpga/linux64/lib ";
# mark_description "-Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7oc";
# mark_description "bc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/compiler/lib/intel64_lin -gcc-name=/usr/bin/gcc -gxx-name=";
# mark_description "/usr/bin/g++ -S -fverbose-asm -D_GNU_SOURCE -DARRAY_ALIGNMENT=64 -O3 -xHost -qopt-zmm-usage=high -std=c99 -o";
# mark_description " ICC/solver.s";
.file "solver.c"
.text
..TXTST0:
.L_2__routine_start_getResult_0:
# -- Begin getResult
#
# getResult(Solver *)
#
# Purpose: every process contributes a slice of the double array found at
# solver+48 to an MPI_Gatherv whose root argument is 0. The process whose
# int field at solver+36 equals 0 first builds the receive buffer and the
# counts/displacements arrays, and afterwards writes the gathered values as
# text to a file (fopen / fprintf / fputc / fclose).
#
# ABI:  first argument arrives in %rdi (see "parameter 1" below).
# In:   %rdi = Solver *
# Exit: either a plain ret (..B1.18), a tail jump to fclose (..B1.17), or
#       exit(1) when fopen returns NULL (..B1.20).
#
# Solver fields read here, by byte offset. The names in parentheses are
# guesses -- NOTE(review): confirm against the struct declaration.
#   24  int     row length minus 2                      (presumably imax)
#   28  int     total row count minus 2                 (presumably jmax)
#   32  int     row count of the local slice            (presumably jmaxLocal)
#   36  int     tested against 0 to select the root     (presumably rank)
#   40  int     length of the counts/displs arrays      (presumably size)
#   48  double* base of the local array
#
# Frame: %rsp is aligned down to 64 bytes, five callee-saved registers are
# pushed (40 bytes) and 88 more bytes are reserved, 128 bytes in total.
#
# NOTE(review): no call to free appears anywhere in this routine for the
# buffers returned by allocate() and the two malloc() calls.
#
.text
# mark_begin;
.align 16,0x90
.globl getResult
# --- getResult(Solver *)
getResult:
# parameter 1: %rdi
..B1.1: # Preds ..B1.0
# Execution count [1.00e+00]
.cfi_startproc
..___tag_value_getResult.1:
..L2:
#73.1
# Prologue: frame pointer in %rbp, 64-byte aligned stack, save r12-r15/rbx.
pushq %rbp #73.1
.cfi_def_cfa_offset 16
movq %rsp, %rbp #73.1
.cfi_def_cfa 6, 16
.cfi_offset 6, -16
andq $-64, %rsp #73.1
pushq %r12 #73.1
pushq %r13 #73.1
pushq %r14 #73.1
pushq %r15 #73.1
pushq %rbx #73.1
subq $88, %rsp #73.1
.cfi_escape 0x10, 0x03, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xd8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf0, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0f, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x22
# r13 = solver, r12 = receive buffer pointer (NULL until the root allocates it).
movq %rdi, %r13 #73.1
xorl %r12d, %r12d #74.18
# Field 36 == 0 selects the root-only setup in ..B1.21.
cmpl $0, 36(%r13) #77.25
je ..B1.21 # Prob 5% #77.25
# LOE rbx r9 r12 r13
..B1.2: # Preds ..B1.1
# Execution count [9.50e-01]
# Non-root path: %rbx and %r9 have not been written by this routine yet, so
# the recvcounts/displs arguments below carry whatever the caller left there.
# NOTE(review): presumably MPI ignores them on non-root ranks -- confirm.
movl 24(%r13), %esi #93.39
movl 32(%r13), %r15d #92.26
# LOE rbx r9 r12 r13 esi r15d
..B1.3: # Preds ..B1.24 ..B1.46 ..B1.45 ..B1.2
# Execution count [1.00e+00]
# Build the MPI_Gatherv call (signature in the comment above the call):
#   rdi      = sendbuf    = base48 + 8*(field24 + 2)
#   esi      = sendcount  = (field24 + 2) * field32
#   edx      = sendtype   (MPI_Datatype handle; presumably MPI_DOUBLE -- confirm)
#   rcx      = recvbuf    = r12
#   r8       = recvcounts = rbx
#   r9       = displs     (set in ..B1.55 on the root path)
#   0(%rsp)  = recvtype   (same handle as sendtype)
#   8(%rsp)  = root       = 0
#   16(%rsp) = comm       (MPI_Comm handle; presumably MPI_COMM_WORLD -- confirm)
# The extra 32 bytes of stack hold the three stack-passed arguments.
movslq %esi, %rsi #94.5
addq $-32, %rsp #94.5
movq 48(%r13), %rax #94.5
movl $1275070475, %edx #94.5
movq %r12, %rcx #94.5
movq %rbx, %r8 #94.5
movl $1275070475, (%rsp) #94.5
lea 16(%rax,%rsi,8), %rdi #94.5
addl $2, %esi #94.5
imull %r15d, %esi #94.5
movl $0, 8(%rsp) #94.5
movl $1140850688, 16(%rsp) #94.5
vzeroupper #94.5
..___tag_value_getResult.11:
# MPI_Gatherv(const void *, int, MPI_Datatype, void *, const int *, const int *, MPI_Datatype, int, MPI_Comm)
call MPI_Gatherv #94.5
..___tag_value_getResult.12:
# LOE r12 r13
..B1.51: # Preds ..B1.3
# Execution count [1.00e+00]
# Release the outgoing-argument area.
addq $32, %rsp #94.5
# LOE r12 r13
..B1.4: # Preds ..B1.51
# Execution count [1.00e+00]
# Only the process with field 36 == 0 writes the file; all others return.
cmpl $0, 36(%r13) #104.25
jne ..B1.18 # Prob 78% #104.25
# LOE r12 r13
..B1.5: # Preds ..B1.4
# Execution count [2.20e-01]
# fopen(.L_2__STRING.4, .L_2__STRING.9); both strings are defined outside
# this view. ebx = field24 and r15d = field28 are captured before the call.
movl $.L_2__STRING.4, %edi #105.9
movl $.L_2__STRING.9, %esi #105.9
movl 24(%r13), %ebx #105.9
movl 28(%r13), %r15d #105.9
# fopen(const char *__restrict__, const char *__restrict__)
call fopen #105.9
# LOE rax r12 ebx r15d
..B1.6: # Preds ..B1.5
# Execution count [2.20e-01]
# NULL FILE* -> print the error text and exit(1) in ..B1.19/..B1.20.
testq %rax, %rax #105.9
je ..B1.19 # Prob 0% #105.9
# LOE rax r12 ebx r15d
..B1.7: # Preds ..B1.6
# Execution count [2.18e-01]
# Outer trip count = field28 + 2; skip straight to fclose if it is <= 0.
addl $2, %r15d #105.9
xorl %edx, %edx #105.9
testl %r15d, %r15d #105.9
jle ..B1.17 # Prob 10% #105.9
# LOE rax r12 edx ebx r15d
..B1.8: # Preds ..B1.7
# Execution count [1.97e-01]
# Loop setup. Spill slots used by the write loops:
#   24(%rsp) = inner bound (field24 + 2, 64-bit)
#   32(%rsp) = gathered buffer pointer (old r12)
#   40(%rsp) = outer bound (field28 + 2)
# Registers: r12 = FILE*, r13d = inner bound, r14d = element offset of the
# current row, r15d = outer counter.
movslq %ebx, %rsi #105.9
lea 2(%rbx), %r13d #105.9
addq $2, %rsi #105.9
xorl %r14d, %r14d #105.9
movq %rsi, 24(%rsp) #105.9[spill]
movl %r15d, 40(%rsp) #105.9[spill]
movl %edx, %r15d #105.9
movq %r12, 32(%rsp) #105.9[spill]
movq %rax, %r12 #105.9
# LOE r12 ebx r13d r14d r15d
..B1.9: # Preds ..B1.15 ..B1.8
# Execution count [1.09e+00]
# Outer loop head: an empty row (inner bound <= 0) only emits the newline.
xorl %edx, %edx #105.9
testl %r13d, %r13d #105.9
jle ..B1.14 # Prob 10% #105.9
# LOE rdx r12 ebx r13d r14d r15d
..B1.10: # Preds ..B1.9
# Execution count [9.83e-01]
# Inner loop setup: rbx = &buffer[row offset], r13 = column counter (0),
# r15 = inner bound. The displaced 32-bit values go to 0/8/16(%rsp).
movslq %r14d, %r14 #105.9
movq 32(%rsp), %rcx #105.9[spill]
movl %r15d, 8(%rsp) #105.9[spill]
movl %r13d, 16(%rsp) #105.9[spill]
movq %rdx, %r13 #105.9
movl %ebx, (%rsp) #105.9[spill]
lea (%rcx,%r14,8), %rax #105.9
movq 24(%rsp), %r15 #105.9[spill]
movq %rax, %rbx #105.9
# LOE rbx r12 r13 r15 r14d
..B1.11: # Preds ..B1.12 ..B1.10
# Execution count [5.46e+00]
# fprintf(file, .L_2__STRING.11, row[col]); eax = 1 tells the variadic callee
# that one vector register (xmm0) carries an argument.
movq %r12, %rdi #105.9
movl $.L_2__STRING.11, %esi #105.9
movl $1, %eax #105.9
vmovsd (%rbx,%r13,8), %xmm0 #105.9
# fprintf(FILE *__restrict__, const char *__restrict__, ...)
call fprintf #105.9
# LOE rbx r12 r13 r15 r14d
..B1.12: # Preds ..B1.11
# Execution count [5.46e+00]
incq %r13 #105.9
cmpq %r15, %r13 #105.9
jl ..B1.11 # Prob 82% #105.9
# LOE rbx r12 r13 r15 r14d
..B1.13: # Preds ..B1.12
# Execution count [9.83e-01]
# Restore the outer-loop registers that the inner loop borrowed.
movl 16(%rsp), %r13d #[spill]
movl 8(%rsp), %r15d #[spill]
movl (%rsp), %ebx #[spill]
# LOE r12 ebx r13d r14d r15d
..B1.14: # Preds ..B1.9 ..B1.13
# Execution count [1.09e+00]
# End of row: fputc('\n', file).
movl $10, %edi #105.9
movq %r12, %rsi #105.9
call fputc #105.9
# LOE r12 ebx r13d r14d r15d
..B1.15: # Preds ..B1.14
# Execution count [1.09e+00]
# Next row: counter++, row offset += field24 + 2.
incl %r15d #105.9
lea 2(%r14,%rbx), %r14d #105.9
cmpl 40(%rsp), %r15d #105.9[spill]
jl ..B1.9 # Prob 82% #105.9
# LOE r12 ebx r13d r14d r15d
..B1.16: # Preds ..B1.15
# Execution count [1.97e-01]
movq %r12, %rax #
# LOE rax
..B1.17: # Preds ..B1.7 ..B1.16
# Execution count [2.18e-01]
# Epilogue followed by a tail call: fclose(file) returns directly to our caller.
movq %rax, %rdi #105.9
addq $88, %rsp #105.9
.cfi_restore 3
popq %rbx #105.9
.cfi_restore 15
popq %r15 #105.9
.cfi_restore 14
popq %r14 #105.9
.cfi_restore 13
popq %r13 #105.9
.cfi_restore 12
popq %r12 #105.9
movq %rbp, %rsp #105.9
popq %rbp #105.9
.cfi_def_cfa 7, 8
.cfi_restore 6
# fclose(FILE *)
jmp fclose #105.9
.cfi_def_cfa 6, 16
.cfi_escape 0x10, 0x03, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xd8, 0xff, 0xff, 0xff, 0x22
.cfi_offset 6, -16
.cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf0, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0f, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x22
# LOE
..B1.18: # Preds ..B1.4
# Execution count [1.00e+00]
# Plain return for processes that do not write the file.
addq $88, %rsp #107.1
.cfi_restore 3
popq %rbx #107.1
.cfi_restore 15
popq %r15 #107.1
.cfi_restore 14
popq %r14 #107.1
.cfi_restore 13
popq %r13 #107.1
.cfi_restore 12
popq %r12 #107.1
movq %rbp, %rsp #107.1
popq %rbp #107.1
.cfi_def_cfa 7, 8
.cfi_restore 6
ret #107.1
.cfi_def_cfa 6, 16
.cfi_escape 0x10, 0x03, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xd8, 0xff, 0xff, 0xff, 0x22
.cfi_offset 6, -16
.cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf0, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0f, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x22
# LOE
..B1.19: # Preds ..B1.6
# Execution count [1.57e-03]: Infreq
# fopen failed: puts() the 7-byte string defined after the routine.
movl $il0_peep_printf_format_0, %edi #105.9
call puts #105.9
# LOE
..B1.20: # Preds ..B1.19
# Execution count [1.57e-03]: Infreq
movl $1, %edi #105.9
# exit(int)
call exit #105.9
# LOE
..B1.21: # Preds ..B1.1
# Execution count [5.00e-02]: Infreq
# Root-only setup. allocate(64, 8 * (field28 + 2) * (field24 + 2)) provides
# the receive buffer; the product is formed in 32 bits before sign extension.
movl 28(%r13), %eax #78.16
movl $64, %edi #78.16
movl 24(%r13), %esi #78.16
addl $2, %eax #78.16
addl $2, %esi #78.16
imull %eax, %esi #78.16
movslq %esi, %rsi #78.16
shlq $3, %rsi #78.16
..___tag_value_getResult.53:
# allocate(int, size_t)
call allocate #78.16
..___tag_value_getResult.54:
# LOE rax r13
..B1.53: # Preds ..B1.21
# Execution count [5.00e-02]: Infreq
movq %rax, %r12 #78.16
# LOE r12 r13
..B1.22: # Preds ..B1.53
# Execution count [5.00e-02]: Infreq
# rbx = malloc(4 * field40): the receive-counts array.
# NOTE(review): the result is used without a NULL check.
movslq 40(%r13), %rdi #79.30
shlq $2, %rdi #79.30
# malloc(size_t)
call malloc #79.30
# LOE rax r12 r13
..B1.54: # Preds ..B1.22
# Execution count [5.00e-02]: Infreq
movq %rax, %rbx #79.30
# LOE rbx r12 r13
..B1.23: # Preds ..B1.54
# Execution count [5.00e-02]: Infreq
# r9 = malloc(4 * field40): the displacements array (also not NULL-checked).
movslq 40(%r13), %rdi #80.30
shlq $2, %rdi #80.30
# malloc(size_t)
call malloc #80.30
# LOE rax rbx r12 r13
..B1.55: # Preds ..B1.23
# Execution count [5.00e-02]: Infreq
movq %rax, %r9 #80.30
# LOE rbx r9 r12 r13
..B1.24: # Preds ..B1.55
# Execution count [4.50e-02]: Infreq
# Entry 0: displs[0] = 0, counts[0] = (field24 + 2) * field32. The same
# product is spilled to (%rsp) as the running displacement for later entries.
# With field40 <= 1 there is nothing else to fill, so go straight to the gather.
movl 24(%r13), %esi #81.45
movl 32(%r13), %r15d #81.24
movl 40(%r13), %r8d #85.29
movl $0, (%r9) #82.9
lea 2(%rsi), %r14d #81.60
movl %r14d, %eax #81.60
imull %r15d, %eax #81.60
movl %eax, (%rsp) #81.60[spill]
movl %eax, (%rbx) #81.9
cmpl $1, %r8d #85.29
jle ..B1.3 # Prob 0% #85.29
# LOE rbx r9 r12 r13 esi r8d r14d r15d
..B1.25: # Preds ..B1.24
# Execution count [4.50e-02]: Infreq
# ecx = field40 - 1 = number of counts[1..] entries still to compute.
# Fewer than 16 entries: only the masked tail in ..B1.39/..B1.40 runs.
movl 28(%r13), %r10d #86.56
lea -1(%r8), %ecx #85.29
cmpl $16, %ecx #85.9
jl ..B1.48 # Prob 10% #85.9
# LOE rbx r9 r12 r13 ecx esi r8d r10d r14d r15d
..B1.26: # Preds ..B1.25
# Execution count [4.50e-02]: Infreq
# Fewer than 123 entries: skip the alignment peel and use ..B1.47.
cmpl $123, %ecx #85.9
jl ..B1.47 # Prob 10% #85.9
# LOE rbx r9 r12 r13 ecx esi r8d r10d r14d r15d
..B1.27: # Preds ..B1.26
# Execution count [4.50e-02]: Infreq
# r11 = (&counts[1]) mod 64. If that address is not even 4-byte aligned, no
# peel can reach a 64-byte boundary, so the peel count is forced to 0.
lea 4(%rbx), %r11 #86.13
andq $63, %r11 #85.9
testl $3, %r11d #85.9
je ..B1.29 # Prob 50% #85.9
# LOE rbx r9 r12 r13 ecx esi r8d r10d r11d r14d r15d
..B1.28: # Preds ..B1.27
# Execution count [2.25e-02]: Infreq
xorl %r11d, %r11d #85.9
jmp ..B1.31 # Prob 100% #85.9
# LOE rbx r9 r12 r13 ecx esi r8d r10d r11d r14d r15d
..B1.29: # Preds ..B1.27
# Execution count [2.25e-02]: Infreq
# Already 64-byte aligned: peel count stays 0.
testl %r11d, %r11d #85.9
je ..B1.31 # Prob 50% #85.9
# LOE rbx r9 r12 r13 ecx esi r8d r10d r11d r14d r15d
..B1.30: # Preds ..B1.29
# Execution count [2.50e-01]: Infreq
# Peel count = (64 - misalignment) / 4 elements, clamped to ecx.
negl %r11d #85.9
addl $64, %r11d #85.9
shrl $2, %r11d #85.9
cmpl %r11d, %ecx #85.9
cmovl %ecx, %r11d #85.9
# LOE rbx r9 r12 r13 ecx esi r8d r10d r11d r14d r15d
..B1.31: # Preds ..B1.28 ..B1.30 ..B1.29
# Execution count [5.00e-02]: Infreq
# edi = ecx - ((ecx - peel) & 15): index where the full 16-lane body ends.
# zmm7 is the per-iteration lane step; the .L_2il0floatpacket.* constants are
# defined outside this view.
movl %ecx, %edi #85.9
subl %r11d, %edi #85.9
andl $15, %edi #85.9
negl %edi #85.9
addl %ecx, %edi #85.9
vmovups .L_2il0floatpacket.0(%rip), %zmm7 #85.9
cmpl $1, %r11d #85.9
jb ..B1.35 # Prob 50% #85.9
# LOE rbx r9 r12 r13 ecx esi edi r8d r10d r11d r14d r15d zmm7
..B1.32: # Preds ..B1.31
# Execution count [4.50e-02]: Infreq
# Peel-loop setup. cltd/idivl: eax = field28 / field40, edx = remainder.
#   zmm4 = broadcast(field24 + 2)
#   zmm3 = broadcast(quotient * (field24 + 2))
#   zmm2 = broadcast(remainder)
#   zmm0 = broadcast(peel count), rdx = peel count, rax = 0 (element index)
# zmm1/zmm5/zmm6 come from constant packets not visible here.
movl %r10d, %eax #86.28
cltd #86.28
vmovups .L_2il0floatpacket.2(%rip), %zmm6 #85.9
vmovups .L_2il0floatpacket.3(%rip), %zmm5 #86.13
vmovups .L_2il0floatpacket.1(%rip), %zmm1 #86.28
idivl %r8d #86.28
movq $0, 8(%rsp) #85.9[spill]
imull %r14d, %eax #86.88
vpbroadcastd %r14d, %zmm4 #86.88
vpbroadcastd %r11d, %zmm0 #85.9
vpbroadcastd %edx, %zmm2 #86.28
vpbroadcastd %eax, %zmm3 #86.88
movslq %r11d, %rdx #85.9
movq 8(%rsp), %rax #85.9[spill]
# LOE rax rdx rbx r9 r12 r13 ecx esi edi r8d r10d r11d r14d r15d zmm0 zmm1 zmm2 zmm3 zmm4 zmm5 zmm6 zmm7
..B1.33: # Preds ..B1.33 ..B1.32
# Execution count [2.50e-01]: Infreq
# Masked peel loop, 16 lanes per pass:
#   k1 = remainder > zmm5 lane values, k2 = peel count > zmm6 lane values
#   value = zmm3 + zmm4 * (zmm1 where k1, else 0)
# stored to counts[1 + rax ..] under k2.
vpcmpgtd %zmm5, %zmm2, %k1 #86.28
vpcmpgtd %zmm6, %zmm0, %k2 #85.9
vpaddd %zmm7, %zmm6, %zmm6 #85.9
vpaddd %zmm7, %zmm5, %zmm5 #86.13
vmovdqa32 %zmm1, %zmm8{%k1}{z} #86.28
vpmulld %zmm8, %zmm4, %zmm9 #86.88
vpaddd %zmm9, %zmm3, %zmm10 #86.88
vmovdqu32 %zmm10, 4(%rbx,%rax,4){%k2} #86.13
addq $16, %rax #85.9
cmpq %rdx, %rax #85.9
jb ..B1.33 # Prob 82% #85.9
# LOE rax rdx rbx r9 r12 r13 ecx esi edi r8d r10d r11d r14d r15d zmm0 zmm1 zmm2 zmm3 zmm4 zmm5 zmm6 zmm7
..B1.34: # Preds ..B1.33
# Execution count [4.50e-02]: Infreq
# The peel covered every entry: go to the displacement pass.
cmpl %r11d, %ecx #85.9
je ..B1.41 # Prob 10% #85.9
# LOE rbx r9 r12 r13 ecx esi edi r8d r10d r11d r14d r15d zmm7
..B1.35: # Preds ..B1.31 ..B1.34 ..B1.47
# Execution count [2.50e-01]: Infreq
# zmm4 = broadcast(r11 + 1) + packet.4 (per-lane indices for the main body).
# Skip the body when fewer than 16 entries lie between r11 and edi.
lea 1(%r11), %edx #86.13
vpbroadcastd %edx, %zmm0 #86.13
lea 16(%r11), %edx #85.9
vpaddd .L_2il0floatpacket.4(%rip), %zmm0, %zmm4 #86.13
cmpl %edx, %edi #85.9
jl ..B1.39 # Prob 50% #85.9
# LOE rbx r9 r12 r13 ecx esi edi r8d r10d r11d r14d r15d zmm4 zmm7
..B1.36: # Preds ..B1.35
# Execution count [4.50e-02]: Infreq
# Main-body setup: rdx = &counts[r11] (saved around idivl, which overwrites
# edx), zmm1 = broadcast(remainder), zmm2 = broadcast(quotient * (field24 + 2)),
# zmm3 = broadcast(field24 + 2).
movslq %r11d, %r11 #85.9
movl %r10d, %eax #86.28
vpbroadcastd %r14d, %zmm3 #86.88
vmovups .L_2il0floatpacket.1(%rip), %zmm0 #86.28
lea (%rbx,%r11,4), %rdx #79.30
movq %rdx, 8(%rsp) #79.30[spill]
cltd #86.28
idivl %r8d #86.28
vpbroadcastd %edx, %zmm1 #86.28
imull %r14d, %eax #86.88
vpbroadcastd %eax, %zmm2 #86.88
movq 8(%rsp), %rdx #86.88[spill]
# LOE rdx rbx r9 r12 r13 ecx esi edi r8d r10d r11d r14d r15d zmm0 zmm1 zmm2 zmm3 zmm4 zmm7
..B1.37: # Preds ..B1.37 ..B1.36
# Execution count [2.50e-01]: Infreq
# Unmasked main body: the same value formula as the peel loop, one full
# 64-byte store per pass at 4(%rdx).
vpcmpgtd %zmm4, %zmm1, %k1 #86.28
addl $16, %r11d #85.9
vpaddd %zmm7, %zmm4, %zmm4 #86.13
vmovdqa32 %zmm0, %zmm5{%k1}{z} #86.28
vpmulld %zmm5, %zmm3, %zmm6 #86.88
vpaddd %zmm6, %zmm2, %zmm8 #86.88
vmovdqu32 %zmm8, 4(%rdx) #86.13
addq $64, %rdx #85.9
cmpl %edi, %r11d #85.9
jb ..B1.37 # Prob 82% #85.9
# LOE rdx rbx r9 r12 r13 ecx esi edi r8d r10d r11d r14d r15d zmm0 zmm1 zmm2 zmm3 zmm4 zmm7
..B1.39: # Preds ..B1.37 ..B1.35 ..B1.48
# Execution count [5.00e-02]: Infreq
# Remainder check: nothing is left when edi + 1 > ecx (unsigned compare).
lea 1(%rdi), %edx #85.9
cmpl %ecx, %edx #85.9
ja ..B1.41 # Prob 50% #85.9
# LOE rbx r9 r12 r13 edx ecx esi edi r8d r10d r14d r15d
..B1.40: # Preds ..B1.39
# Execution count [2.50e-01]: Infreq
# Masked tail: one pass writing the last (ecx - edi) entries at
# counts[1 + edi ..] under k2, using the same value formula as above.
movl %r10d, %eax #86.28
movl %ecx, %r10d #85.9
vpbroadcastd %edx, %zmm0 #86.13
subl %edi, %r10d #85.9
cltd #86.28
vpbroadcastd %r14d, %zmm3 #86.88
vpaddd .L_2il0floatpacket.4(%rip), %zmm0, %zmm2 #86.13
vpbroadcastd %r10d, %zmm7 #85.9
idivl %r8d #86.28
vpbroadcastd %edx, %zmm1 #86.28
imull %eax, %r14d #86.88
vpcmpgtd .L_2il0floatpacket.2(%rip), %zmm7, %k2 #85.9
vpcmpgtd %zmm2, %zmm1, %k1 #86.28
vpbroadcastd %r14d, %zmm5 #86.88
vmovdqu32 .L_2il0floatpacket.1(%rip), %zmm4{%k1}{z} #86.28
movslq %edi, %rdi #86.13
vpmulld %zmm4, %zmm3, %zmm6 #86.88
vpaddd %zmm6, %zmm5, %zmm8 #86.88
vmovdqu32 %zmm8, 4(%rbx,%rdi,4){%k2} #86.13
# LOE rbx r9 r12 r13 ecx esi r15d
..B1.41: # Preds ..B1.34 ..B1.39 ..B1.40
# Execution count [5.00e-02]: Infreq
# Displacement pass (scalar running sum, unrolled by two):
# eax = ecx / 2 pair iterations, edi = 1 is the index of a possible leftover.
movl %ecx, %eax #85.9
movl $1, %edi #85.9
xorl %edx, %edx #85.9
shrl $1, %eax #85.9
je ..B1.45 # Prob 10% #85.9
# LOE rax rdx rbx r9 r12 r13 ecx esi edi r15d
..B1.42: # Preds ..B1.41
# Execution count [4.50e-02]: Infreq
# r11d = running displacement, seeded from the counts[0] value spilled in ..B1.24.
movl (%rsp), %r11d #85.9[spill]
# LOE rax rdx rbx r9 r12 r13 ecx esi r11d r15d
..B1.43: # Preds ..B1.43 ..B1.42
# Execution count [1.25e-01]: Infreq
# Pair k (rdx): displs[2k+1] = sum; sum += counts[2k+1];
#               displs[2k+2] = sum; sum += counts[2k+2].
movl 4(%rbx,%rdx,8), %edi #88.23
movl %r11d, 4(%r9,%rdx,8) #87.13
addl %edi, %r11d #88.13
movl %r11d, 8(%r9,%rdx,8) #87.13
movl 8(%rbx,%rdx,8), %r10d #88.23
incq %rdx #85.9
addl %r10d, %r11d #88.13
cmpq %rax, %rdx #85.9
jb ..B1.43 # Prob 64% #85.9
# LOE rax rdx rbx r9 r12 r13 ecx esi r11d r15d
..B1.44: # Preds ..B1.43
# Execution count [4.50e-02]: Infreq
# Save the running sum; edi = 2 * pairs + 1 = index of the next unwritten entry.
movl %r11d, (%rsp) #[spill]
lea 1(%rdx,%rdx), %edi #86.13
# LOE rbx r9 r12 r13 ecx esi edi r15d
..B1.45: # Preds ..B1.44 ..B1.41
# Execution count [5.00e-02]: Infreq
# Even entry count: done. Odd count: one entry remains for ..B1.46.
lea -1(%rdi), %eax #85.9
cmpl %ecx, %eax #85.9
jae ..B1.3 # Prob 10% #85.9
# LOE rbx r9 r12 r13 esi edi r15d
..B1.46: # Preds ..B1.45
# Execution count [4.50e-02]: Infreq
# Leftover entry: displs[edi] = running sum, then continue with the gather.
movslq %edi, %rdi #86.13
movl (%rsp), %eax #87.13[spill]
movl %eax, (%r9,%rdi,4) #87.13
jmp ..B1.3 # Prob 100% #87.13
# LOE rbx r9 r12 r13 esi r15d
..B1.47: # Preds ..B1.26
# Execution count [4.50e-03]: Infreq
# Medium trip count (16..122): no peel (r11d = 0), body end = ecx rounded
# down to a multiple of 16.
movl %ecx, %edi #85.9
xorl %r11d, %r11d #85.9
vmovups .L_2il0floatpacket.0(%rip), %zmm7 #86.13
andl $-16, %edi #85.9
jmp ..B1.35 # Prob 100% #85.9
# LOE rbx r9 r12 r13 ecx esi edi r8d r10d r11d r14d r15d zmm7
..B1.48: # Preds ..B1.25
# Execution count [4.50e-03]: Infreq
# Short trip count (< 16): the masked tail starts at index 0.
xorl %edi, %edi #85.9
jmp ..B1.39 # Prob 100% #85.9
.align 16,0x90
# LOE rbx r9 r12 r13 ecx esi edi r8d r10d r14d r15d
.cfi_endproc
# mark_end;
.type getResult,@function
.size getResult,.-getResult
..LNgetResult.0:
.section .rodata.str1.4, "aMS",@progbits,1
.align 4
.align 4
# Message passed to puts() in ..B1.19. Read as little-endian bytes the three
# items below spell 'E','r','r','o' / 'r','!' / NUL, i.e. the string "Error!".
il0_peep_printf_format_0:
.long 1869771333
.word 8562
.byte 0
.data
# -- End getResult
.text
.L_2__routine_start_debug_1:
# -- Begin debug
#
# debug(Solver *)
#
# Purpose: loops i = 0 .. field40-1. On the pass where i equals the value of
# field36 read at entry, the routine prints a header, then the double array at
# solver+48 row by row with printf/putchar, and flushes stdout. Every pass
# ends with an MPI_Barrier call.
#
# ABI:  first argument arrives in %rdi (see "parameter 1" below).
# In:   %rdi = Solver *
# Out:  nothing is placed in a return register by this code.
#
# Solver fields read here, by byte offset. The names in parentheses are
# guesses -- NOTE(review): confirm against the struct declaration.
#   24  int     row length minus 2            (presumably imax)
#   32  int     row count minus 2             (presumably jmaxLocal)
#   36  int     index of the printing pass    (presumably rank)
#   40  int     loop bound                    (presumably size)
#   48  double* array that gets printed
#
# Frame: 72 bytes, no pushes. Callee-saved registers are stored at
# 0..40(%rsp) only when the loop is entered; 48/56/64(%rsp) are spill slots.
#
.text
# mark_begin;
.align 16,0x90
.globl debug
# --- debug(Solver *)
debug:
# parameter 1: %rdi
..B2.1: # Preds ..B2.0
# Execution count [1.00e+00]
.cfi_startproc
..___tag_value_debug.64:
..L65:
#162.1
# eax = 0 (loop counter seed), edx = field36. Return at once if field40 <= 0.
subq $72, %rsp #162.1
.cfi_def_cfa_offset 80
xorl %eax, %eax #187.16
movl 36(%rdi), %edx #164.17
cmpl $0, 40(%rdi) #187.25
jle ..B2.20 # Prob 10% #187.25
# LOE rbx rbp rdi r12 r13 r14 r15 eax edx
..B2.2: # Preds ..B2.1
# Execution count [9.00e-01]
# Save r12-r15, rbx and rbp in the frame, then set up the loop registers:
# r12d = i (0), r13d = field36 as read at entry, rbx = solver.
movq %r12, (%rsp) #[spill]
.cfi_offset 12, -80
movl %eax, %r12d #
movq %r13, 8(%rsp) #[spill]
.cfi_offset 13, -72
movl %edx, %r13d #
movq %r14, 16(%rsp) #[spill]
movq %r15, 24(%rsp) #[spill]
movq %rbx, 32(%rsp) #[spill]
.cfi_offset 3, -48
.cfi_offset 14, -64
.cfi_offset 15, -56
movq %rdi, %rbx #
movq %rbp, 40(%rsp) #[spill]
.cfi_offset 6, -40
# LOE rbx r12d r13d
..B2.3: # Preds ..B2.18 ..B2.2
# Execution count [5.00e+00]
# Only the pass with i == field36 prints; the others go straight to the barrier.
cmpl %r13d, %r12d #188.18
jne ..B2.17 # Prob 78% #188.18
# LOE rbx r12d r13d
..B2.4: # Preds ..B2.3
# Execution count [1.10e+00]
# printf(.L_2__STRING.0, field36); eax = 0 because no vector register carries
# an argument. r15 = array base and r14d = field24 are captured for the loops.
# The format strings are defined outside this view.
movl $.L_2__STRING.0, %edi #189.13
xorl %eax, %eax #189.13
movl 36(%rbx), %esi #189.13
movq 48(%rbx), %r15 #189.13
movl 24(%rbx), %r14d #189.13
..___tag_value_debug.79:
# printf(const char *__restrict__, ...)
call printf #189.13
..___tag_value_debug.80:
# LOE rbx r15 r12d r13d r14d
..B2.5: # Preds ..B2.4
# Execution count [1.10e+00]
# Row count = field32 + 2; with no rows only the flush remains.
movl 32(%rbx), %ecx #189.13
xorl %esi, %esi #189.13
addl $2, %ecx #189.13
testl %ecx, %ecx #189.13
jle ..B2.16 # Prob 10% #189.13
# LOE rbx r15 esi r12d r13d r14d
..B2.6: # Preds ..B2.5
# Execution count [9.90e-01]
# Park i and field36 in 56/48(%rsp) so r12/r13 can be reused:
# ebp = element offset of the current row (0), r13d = field24 snapshot,
# r14d = row index (0).
movl %r12d, 56(%rsp) #189.13[spill]
xorl %ebp, %ebp #189.13
movl %r13d, 48(%rsp) #189.13[spill]
movl %r14d, %r13d #189.13
movl %esi, %r14d #189.13
# LOE rbx r15 ebp r13d r14d
..B2.7: # Preds ..B2.14 ..B2.6
# Execution count [5.50e+00]
# Row prefix: printf(.L_2__STRING.1, row index).
movl $.L_2__STRING.1, %edi #189.13
movl %r14d, %esi #189.13
xorl %eax, %eax #189.13
..___tag_value_debug.83:
# printf(const char *__restrict__, ...)
call printf #189.13
..___tag_value_debug.84:
# LOE rbx r15 ebp r13d r14d
..B2.8: # Preds ..B2.7
# Execution count [5.50e+00]
# Column count = field24 + 2, re-read from the struct; an empty row only
# prints the newline.
movl 24(%rbx), %edx #189.13
xorl %eax, %eax #189.13
addl $2, %edx #189.13
testl %edx, %edx #189.13
jle ..B2.13 # Prob 10% #189.13
# LOE rax rbx r15 ebp r13d r14d
..B2.9: # Preds ..B2.8
# Execution count [4.95e+00]
# r12 = &array[row offset]; the array base moves to 64(%rsp) so r15 can
# serve as the column counter (starting at 0).
movslq %ebp, %rbp #189.13
movq %r15, 64(%rsp) #189.13[spill]
lea (%r15,%rbp,8), %r12 #189.13
movq %rax, %r15 #189.13
# LOE rbx r12 r15 ebp r13d r14d
..B2.10: # Preds ..B2.11 ..B2.9
# Execution count [2.75e+01]
# printf(.L_2__STRING.2, row[col]); eax = 1 because xmm0 carries the double.
vmovsd (%r12,%r15,8), %xmm0 #189.13
movl $.L_2__STRING.2, %edi #189.13
movl $1, %eax #189.13
..___tag_value_debug.86:
# printf(const char *__restrict__, ...)
call printf #189.13
..___tag_value_debug.87:
# LOE rbx r12 r15 ebp r13d r14d
..B2.11: # Preds ..B2.10
# Execution count [2.75e+01]
# The bound field24 + 2 is reloaded from memory on every iteration.
movslq 24(%rbx), %rdx #189.13
incq %r15 #189.13
addq $2, %rdx #189.13
cmpq %rdx, %r15 #189.13
jl ..B2.10 # Prob 82% #189.13
# LOE rbx r12 r15 ebp r13d r14d
..B2.12: # Preds ..B2.11
# Execution count [4.95e+00]
# Bring the array base back into r15.
movq 64(%rsp), %r15 #[spill]
# LOE rbx r15 ebp r13d r14d
..B2.13: # Preds ..B2.12 ..B2.8
# Execution count [5.50e+00]
# End of row: putchar('\n').
movl $10, %edi #189.13
call putchar #189.13
# LOE rbx r15 ebp r13d r14d
..B2.14: # Preds ..B2.13
# Execution count [5.50e+00]
# Next row: index++, offset += (field24 snapshot) + 2; the bound field32 + 2
# is reloaded from the struct.
movl 32(%rbx), %eax #189.13
incl %r14d #189.13
addl $2, %eax #189.13
lea 2(%rbp,%r13), %ebp #189.13
cmpl %eax, %r14d #189.13
jl ..B2.7 # Prob 82% #189.13
# LOE rbx r15 ebp r13d r14d
..B2.15: # Preds ..B2.14
# Execution count [9.90e-01]
# Restore i and the field36 value for the outer loop.
movl 56(%rsp), %r12d #[spill]
movl 48(%rsp), %r13d #[spill]
# LOE rbx r12d r13d
..B2.16: # Preds ..B2.15 ..B2.5
# Execution count [1.10e+00]
# fflush(stdout) after the printing pass.
movq stdout(%rip), %rdi #189.13
# fflush(FILE *)
call fflush #189.13
# LOE rbx r12d r13d
..B2.17: # Preds ..B2.16 ..B2.3
# Execution count [5.00e+00]
# Executed on every pass. The immediate is the MPI_Comm handle (presumably
# MPI_COMM_WORLD in this MPI's headers -- confirm).
movl $1140850688, %edi #191.9
..___tag_value_debug.91:
# MPI_Barrier(MPI_Comm)
call MPI_Barrier #191.9
..___tag_value_debug.92:
# LOE rbx r12d r13d
..B2.18: # Preds ..B2.17
# Execution count [5.00e+00]
# i++, loop while i < field40 (reloaded from the struct each pass).
incl %r12d #187.39
cmpl 40(%rbx), %r12d #187.25
jl ..B2.3 # Prob 82% #187.25
# LOE rbx r12d r13d
..B2.19: # Preds ..B2.18
# Execution count [9.00e-01]
# Reload the callee-saved registers stored in ..B2.2.
movq (%rsp), %r12 #[spill]
.cfi_restore 12
movq 8(%rsp), %r13 #[spill]
.cfi_restore 13
movq 16(%rsp), %r14 #[spill]
.cfi_restore 14
movq 24(%rsp), %r15 #[spill]
.cfi_restore 15
movq 32(%rsp), %rbx #[spill]
.cfi_restore 3
movq 40(%rsp), %rbp #[spill]
.cfi_restore 6
# LOE rbx rbp r12 r13 r14 r15
..B2.20: # Preds ..B2.19 ..B2.1
# Execution count [1.00e+00]
# Common exit: drop the 72-byte frame and return.
addq $72, %rsp #193.1
.cfi_def_cfa_offset 8
ret #193.1
.align 16,0x90
# LOE
.cfi_endproc
# mark_end;
.type debug,@function
.size debug,.-debug
..LNdebug.1:
.data
# -- End debug
.text
.L_2__routine_start_solve_2:
# -- Begin solve
.text
# mark_begin;
.align 16,0x90
.globl solve
# --- solve(Solver *)
solve:
# parameter 1: %rdi
..B3.1: # Preds ..B3.0
# Execution count [1.00e+00]
.cfi_startproc
..___tag_value_solve.106:
..L107:
#196.1
pushq %rbp #196.1
.cfi_def_cfa_offset 16
movq %rsp, %rbp #196.1
.cfi_def_cfa 6, 16
.cfi_offset 6, -16
andq $-64, %rsp #196.1
pushq %r12 #196.1
pushq %r13 #196.1
pushq %r14 #196.1
pushq %r15 #196.1
pushq %rbx #196.1
subq $408, %rsp #196.1
movq %rdi, %r11 #196.1
vmovsd .L_2il0floatpacket.5(%rip), %xmm2 #212.29
xorl %esi, %esi #198.12
vmovsd .L_2il0floatpacket.9(%rip), %xmm9 #210.27
vmovsd (%r11), %xmm6 #208.21
vmulsd %xmm6, %xmm6, %xmm4 #208.34
vmulsd 72(%r11), %xmm2, %xmm3 #212.29
vdivsd %xmm4, %xmm9, %xmm11 #210.27
vmovsd 8(%r11), %xmm1 #209.21
vmulsd %xmm1, %xmm1, %xmm8 #209.34
vmulsd %xmm4, %xmm3, %xmm5 #212.42
vdivsd %xmm8, %xmm9, %xmm10 #211.27
vmovsd 64(%r11), %xmm0 #204.21
vmulsd %xmm8, %xmm5, %xmm7 #212.42
vaddsd %xmm9, %xmm0, %xmm1 #217.17
vfmadd231sd %xmm6, %xmm6, %xmm8 #212.56
vmulsd %xmm0, %xmm0, %xmm5 #215.27
vdivsd %xmm8, %xmm7, %xmm6 #212.56
movl 88(%r11), %eax #206.21
movl %eax, 288(%rsp) #206.21[spill]
.cfi_escape 0x10, 0x03, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xd8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf0, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0f, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x22
movl 24(%r11), %r13d #201.21
movl 28(%r11), %edx #202.21
movl 32(%r11), %r10d #203.21
movq 48(%r11), %r9 #213.21
movq 56(%r11), %rax #214.21
vcomisd %xmm5, %xmm1 #219.20
jb ..B3.32 # Prob 10% #219.20
# LOE rax r9 r11 edx esi r10d r13d xmm0 xmm1 xmm5 xmm6 xmm10 xmm11
..B3.2: # Preds ..B3.1
# Execution count [9.00e-01]
movl %r13d, %ecx #203.19
movl %r13d, %r8d #241.13
imull %r10d, %ecx #203.19
vxorpd %xmm4, %xmm4, %xmm4 #253.34
imull %r13d, %edx #253.34
vmovsd .L_2il0floatpacket.8(%rip), %xmm2 #226.49
vmovsd %xmm5, 264(%rsp) #223.9[spill]
vmovsd %xmm6, 328(%rsp) #223.9[spill]
vmovsd %xmm10, 336(%rsp) #223.9[spill]
shrl $1, %r8d #241.13
lea (%r13,%rcx), %edi #203.19
vcvtsi2sd %edx, %xmm4, %xmm4 #253.34
vmovdqu .L_2il0floatpacket.6(%rip), %ymm3 #235.13
vmovsd %xmm4, 272(%rsp) #223.9[spill]
movl %r8d, 176(%rsp) #241.13[spill]
lea (%rdi,%r10,2), %edx #203.19
movl %edx, 48(%rsp) #203.19[spill]
lea (%rcx,%r10,2), %r8d #203.19
movslq %edx, %rdx #242.17
movl %r10d, %ecx #246.9
movslq %r8d, %r8 #242.39
shrl $1, %ecx #246.9
movl %ecx, 240(%rsp) #246.9[spill]
movl $0, 280(%rsp) #219.5[spill]
lea (%r9,%rdx,8), %r15 #242.17
movq %r15, 88(%rsp) #242.17[spill]
lea (%r9,%r8,8), %r12 #242.39
movq %r12, 80(%rsp) #242.39[spill]
lea 24(%r15), %r14 #242.17
movq %r14, 128(%rsp) #242.17[spill]
lea 8(%r12), %rdi #242.39
movq %rdi, 104(%rsp) #242.39[spill]
subq %rdi, %r14 #241.13
movslq %r13d, %rdi #226.21
lea (%r13,%r13,2), %r12d #248.30
movl %r12d, 208(%rsp) #248.30[spill]
lea 4(%r13,%r13), %r12d #227.68
movl %r12d, 200(%rsp) #227.68[spill]
vmovsd %xmm11, 344(%rsp) #223.9[spill]
vmovsd %xmm0, 32(%rsp) #223.9[spill]
lea (,%rdi,8), %rcx #227.58
cmpq %rcx, %r14 #241.13
lea (%rax,%rdi,8), %rdx #226.21
movq %rdx, 304(%rsp) #226.21[spill]
movl $0, %edx #241.13
setg %dl #241.13
negq %r14 #241.13
xorl %eax, %eax #241.13
cmpq %rcx, %r14 #241.13
movq %rcx, 144(%rsp) #223.9[spill]
lea (%rcx,%rdi,8), %rbx #248.30
setg %al #241.13
lea (%r9,%rdi,8), %r14 #226.35
orl %eax, %edx #241.13
movl %r13d, %eax #235.13
addq %r9, %rbx #248.30
andl $-8, %eax #235.13
movq %rbx, 216(%rsp) #248.30[spill]
lea 24(%r14), %rbx #236.27
movl %eax, 40(%rsp) #235.13[spill]
lea 8(%r9), %rax #236.17
movq %rbx, 120(%rsp) #236.27[spill]
subq %rax, %rbx #235.13
movq %rbx, %r12 #235.13
lea 16(,%rdi,8), %r15 #226.21
negq %r12 #235.13
cmpq %rcx, %r12 #235.13
movl $0, %r12d #235.13
movq %rax, 136(%rsp) #236.17[spill]
setg %r12b #235.13
cmpq %rcx, %rbx #235.13
movl $0, %ebx #235.13
setg %bl #235.13
andq $63, %rax #235.13
movl %eax, 112(%rsp) #235.13[spill]
orl %ebx, %r12d #235.13
movl %eax, %ebx #235.13
negl %eax #235.13
andl $7, %ebx #235.13
movq %r15, 312(%rsp) #226.21[spill]
movl %r13d, %r15d #247.30
addl $64, %eax #235.13
negl %r15d #247.30
shrl $3, %eax #235.13
movl %r15d, 224(%rsp) #247.30[spill]
lea 2(%r13), %r15d #227.68
movl %ebx, 96(%rsp) #235.13[spill]
movl %eax, 296(%rsp) #235.13[spill]
movslq %r10d, %rbx #223.9
movl %r12d, 160(%rsp) #223.9[spill]
xorl %r12d, %r12d #223.9
movl %edx, 152(%rsp) #223.9[spill]
movq %rdi, 352(%rsp) #223.9[spill]
movl %r8d, 56(%rsp) #223.9[spill]
movq %r9, 320(%rsp) #223.9[spill]
movl %r10d, 248(%rsp) #223.9[spill]
movq %r11, 256(%rsp) #223.9[spill]
# LOE rbx r12 r14 esi r13d r15d xmm1
..B3.3: # Preds ..B3.30 ..B3.2
# Execution count [2.62e+00]
movl 280(%rsp), %eax #219.5[spill]
incl %eax #219.5
movl %eax, 280(%rsp) #219.5[spill]
lea -1(%rax), %edx #252.9
cmpl 288(%rsp), %edx #219.36[spill]
jge ..B3.31 # Prob 20% #219.36
# LOE rbx r12 r14 esi r13d r15d xmm1
..B3.4: # Preds ..B3.3
# Execution count [2.09e+00]
movq 256(%rsp), %rax #221.9[spill]
movl $738197504, %ecx #221.9
movl %ecx, 64(%rsp) #221.9
movl %ecx, 68(%rsp) #221.9
movl %ecx, 72(%rsp) #221.9
movl %ecx, 76(%rsp) #221.9
movl 36(%rax), %ecx #221.9
movq %r12, 368(%rsp) #220.9
lea 1(%rcx), %r10d #221.9
cmpl 40(%rax), %r10d #221.9
jge ..B3.8 # Prob 78% #221.9
# LOE rax rbx r12 r14 ecx r10d r13d r15d
..B3.5: # Preds ..B3.4
# Execution count [4.60e-01]
addq $-16, %rsp #221.9
movl %r10d, %ecx #221.9
lea 80(%rsp), %r8 #221.9
movl $1140850688, %r9d #221.9
movl 24(%rax), %esi #221.9
movl 32(%rax), %edx #221.9
movq 48(%rax), %rax #221.9
movl %edx, -56(%r8) #221.9[spill]
lea 2(%rsi), %r11d #221.9
movl %r11d, 16(%rsp) #221.9[spill]
imull %edx, %r11d #221.9
movl $1275070475, %edx #221.9
movslq %r11d, %r11 #221.9
movq %r8, (%rsp) #221.9
movl $1, %r8d #221.9
movq %rax, 32(%rsp) #221.9[spill]
movl %r10d, 40(%rsp) #221.9[spill]
lea 8(%rax,%r11,8), %rdi #221.9
vzeroupper #221.9
..___tag_value_solve.159:
# MPI_Isend(const void *, int, MPI_Datatype, int, int, MPI_Comm, MPI_Request *)
call MPI_Isend #221.9
..___tag_value_solve.160:
# LOE rbx r12 r14 r13d r15d
..B3.82: # Preds ..B3.5
# Execution count [4.60e-01]
movl 40(%rsp), %r10d #[spill]
movq 32(%rsp), %rax #[spill]
# LOE rax rbx r12 r14 r10d r13d r15d
..B3.6: # Preds ..B3.82
# Execution count [4.60e-01]
movl $1275070475, %edx #221.9
movl 24(%rsp), %r11d #221.9[spill]
movl %r10d, %ecx #221.9
incl %r11d #221.9
movl $2, %r8d #221.9
imull 16(%rsp), %r11d #221.9[spill]
movl $1140850688, %r9d #221.9
movslq %r11d, %r11 #221.9
lea 8(%rax,%r11,8), %rdi #221.9
lea 84(%rsp), %rax #221.9
movq %rax, (%rsp) #221.9
movq 188(%rax), %rax #221.9[spill]
movl 24(%rax), %esi #221.9
..___tag_value_solve.166:
# MPI_Irecv(void *, int, MPI_Datatype, int, int, MPI_Comm, MPI_Request *)
call MPI_Irecv #221.9
..___tag_value_solve.167:
# LOE rbx r12 r14 r13d r15d
..B3.83: # Preds ..B3.6
# Execution count [4.60e-01]
addq $16, %rsp #221.9
# LOE rbx r12 r14 r13d r15d
..B3.7: # Preds ..B3.83
# Execution count [4.60e-01]
movq 256(%rsp), %rax #221.9[spill]
movl 36(%rax), %ecx #221.9
# LOE rbx r12 r14 ecx r13d r15d
..B3.8: # Preds ..B3.4 ..B3.7
# Execution count [2.09e+00]
testl %ecx, %ecx #221.9
jle ..B3.11 # Prob 40% #221.9
# LOE rbx r12 r14 ecx r13d r15d
..B3.9: # Preds ..B3.8
# Execution count [1.25e+00]
addq $-16, %rsp #221.9
decl %ecx #221.9
movl $1275070475, %edx #221.9
lea 88(%rsp), %rax #221.9
movl $2, %r8d #221.9
movl $1140850688, %r9d #221.9
movq %rax, (%rsp) #221.9
movq 184(%rax), %rax #221.9[spill]
movl %ecx, 208(%rsp) #221.9[spill]
movq 48(%rax), %r10 #221.9
movslq 24(%rax), %r11 #221.9
movl 24(%rax), %esi #221.9
movq %r10, 200(%rsp) #221.9[spill]
lea 24(%r10,%r11,8), %rdi #221.9
vzeroupper #221.9
..___tag_value_solve.172:
# MPI_Isend(const void *, int, MPI_Datatype, int, int, MPI_Comm, MPI_Request *)
call MPI_Isend #221.9
..___tag_value_solve.173:
# LOE rbx r12 r14 r13d r15d
..B3.84: # Preds ..B3.9
# Execution count [1.25e+00]
movl 208(%rsp), %ecx #[spill]
# LOE rbx r12 r14 ecx r13d r15d
..B3.10: # Preds ..B3.84
# Execution count [1.25e+00]
movl $1275070475, %edx #221.9
movq 200(%rsp), %rdi #221.9[spill]
lea 92(%rsp), %rax #221.9
addq $8, %rdi #221.9
movl $1, %r8d #221.9
movl $1140850688, %r9d #221.9
movq %rax, (%rsp) #221.9
movq 180(%rax), %r10 #221.9[spill]
movl 24(%r10), %esi #221.9
..___tag_value_solve.177:
# MPI_Irecv(void *, int, MPI_Datatype, int, int, MPI_Comm, MPI_Request *)
call MPI_Irecv #221.9
..___tag_value_solve.178:
# LOE rbx r12 r14 r13d r15d
..B3.85: # Preds ..B3.10
# Execution count [1.25e+00]
addq $16, %rsp #221.9
# LOE rbx r12 r14 r13d r15d
..B3.11: # Preds ..B3.85 ..B3.8
# Execution count [2.09e+00]
movl $4, %edi #221.9
lea 64(%rsp), %rsi #221.9
movl $1, %edx #221.9
vzeroupper #221.9
..___tag_value_solve.179:
# MPI_Waitall(int, MPI_Request *, MPI_Status *)
call MPI_Waitall #221.9
..___tag_value_solve.180:
# LOE rbx r12 r14 r13d r15d
..B3.12: # Preds ..B3.11
# Execution count [2.09e+00]
movq %r12, %rcx #223.9
cmpl $0, 248(%rsp) #223.41[spill]
jle ..B3.75 # Prob 10% #223.41
# LOE rcx rbx r12 r14 r13d r15d
..B3.13: # Preds ..B3.12
# Execution count [9.42e+00]
testl %r13d, %r13d #224.40
jle ..B3.72 # Prob 10% #224.40
# LOE rcx rbx r12 r14 r13d r15d
..B3.14: # Preds ..B3.13
# Execution count [1.83e+00]
vmovsd .L_2il0floatpacket.8(%rip), %xmm0 #
vmovsd 328(%rsp), %xmm1 #[spill]
vmovsd 336(%rsp), %xmm2 #[spill]
vmovsd 344(%rsp), %xmm3 #[spill]
movq 304(%rsp), %rdi #[spill]
movq 312(%rsp), %rdx #[spill]
movq 320(%rsp), %rsi #[spill]
# LOE rdx rcx rbx rsi rdi r12 r14 r13d r15d xmm0 xmm1 xmm2 xmm3
..B3.15: # Preds ..B3.19 ..B3.14
# Execution count [9.42e+00]
movq %rcx, %r8 #227.58
movl %ecx, %eax #226.17
imulq %rdx, %r8 #227.58
imull %r15d, %eax #227.68
movl %r13d, 360(%rsp) #227.68[spill]
lea (%rax,%r13,2), %eax #227.68
movslq %eax, %rax #227.68
movq %r12, %r9 #227.58
movq 352(%rsp), %r13 #227.68[spill]
lea (%rsi,%r8), %r10 #227.38
lea (%rdi,%r8), %r11 #226.21
addq %r14, %r8 #227.58
lea (%rsi,%rax,8), %rax #227.68
.align 16,0x90
# LOE rax rdx rcx rbx rsi rdi r8 r9 r10 r11 r12 r13 r14 r15d xmm0 xmm1 xmm2 xmm3
..B3.16: # Preds ..B3.16 ..B3.15
# Execution count [5.23e+01]
vmovsd 24(%r8,%r9,8), %xmm10 #226.55
vmulsd %xmm10, %xmm0, %xmm7 #227.58
vmovsd 16(%r8,%r9,8), %xmm6 #226.35
vmovsd 8(%r10,%r9,8), %xmm4 #227.38
vsubsd %xmm7, %xmm6, %xmm8 #226.55
vsubsd %xmm7, %xmm4, %xmm5 #227.58
vaddsd 32(%r8,%r9,8), %xmm8, %xmm12 #226.65
vaddsd 40(%rax,%r9,8), %xmm5, %xmm9 #227.68
vfnmadd213sd 24(%r11,%r9,8), %xmm3, %xmm12 #226.17
vfnmadd231sd %xmm2, %xmm9, %xmm12 #226.17
vfnmadd231sd %xmm1, %xmm12, %xmm10 #229.17
vmovsd %xmm10, 24(%r8,%r9,8) #229.17
vmovsd 368(%rsp), %xmm11 #230.17
incq %r9 #224.13
vfmadd213sd %xmm11, %xmm12, %xmm12 #230.17
vmovsd %xmm12, 368(%rsp) #230.17
cmpq %r13, %r9 #224.13
jb ..B3.16 # Prob 82% #224.13
# LOE rax rdx rcx rbx rsi rdi r8 r9 r10 r11 r12 r13 r14 r15d xmm0 xmm1 xmm2 xmm3
..B3.17: # Preds ..B3.16
# Execution count [9.42e+00]
incq %rcx #223.9
movl 360(%rsp), %r13d #[spill]
cmpq %rbx, %rcx #223.9
jae ..B3.35 # Prob 18% #223.9
# LOE rdx rcx rbx rsi rdi r12 r14 r13d r15d xmm0 xmm1 xmm2 xmm3
..B3.19: # Preds ..B3.74 ..B3.17 ..B3.21
# Execution count [8.43e+00]
testl %r13d, %r13d #224.40
jg ..B3.15 # Prob 90% #224.40
# LOE rdx rcx rbx rsi rdi r12 r14 r13d r15d xmm0 xmm1 xmm2 xmm3
..B3.21: # Preds ..B3.19
# Execution count [7.19e-01]: Infreq
incq %rcx #223.9
cmpq %rbx, %rcx #223.9
jb ..B3.19 # Prob 82% #223.9
# LOE rdx rcx rbx rsi rdi r12 r14 r13d r15d xmm0 xmm1 xmm2 xmm3
..B3.22: # Preds ..B3.21
# Execution count [1.29e-01]: Infreq
vmovsd %xmm1, 328(%rsp) #[spill]
vmovsd %xmm2, 336(%rsp) #[spill]
vmovsd %xmm3, 344(%rsp) #[spill]
movq %rsi, 320(%rsp) #[spill]
# LOE rbx r12 r14 r13d r15d
..B3.23: # Preds ..B3.73 ..B3.72 ..B3.22 ..B3.44 ..B3.40
#
# Execution count [2.09e+00]: Infreq
xorl %r8d, %r8d #246.9
movl $1, %edx #246.9
xorl %ecx, %ecx #247.13
cmpl $0, 240(%rsp) #246.9[spill]
je ..B3.27 # Prob 10% #246.9
# LOE rbx r12 r14 edx ecx r8d r13d r15d
..B3.24: # Preds ..B3.23
# Execution count [1.88e+00]: Infreq
movl 200(%rsp), %edi #[spill]
movl 208(%rsp), %esi #[spill]
movl 240(%rsp), %eax #[spill]
movq 320(%rsp), %rdx #[spill]
.align 16,0x90
# LOE rdx rbx r12 r14 eax ecx esi edi r8d r13d r15d
..B3.25: # Preds ..B3.25 ..B3.24
# Execution count [5.23e+00]: Infreq
movl %ecx, %r9d #247.30
incl %r8d #246.9
subl %r13d, %r9d #247.30
lea (%r9,%r13,2), %r10d #247.30
movslq %r10d, %r10 #247.30
lea (%rcx,%r13,2), %r9d #248.30
movslq %r9d, %r9 #248.30
movq 24(%rdx,%r10,8), %r11 #247.30
movq %r11, 16(%rdx,%r10,8) #247.13
lea (%rsi,%rcx), %r10d #227.68
movq 16(%rdx,%r9,8), %r11 #248.30
addl %edi, %ecx #246.9
movslq %r10d, %r10 #248.30
movq %r11, 24(%rdx,%r9,8) #248.13
movq 40(%rdx,%r9,8), %r11 #247.30
movq %r11, 32(%rdx,%r9,8) #247.13
movq 32(%rdx,%r10,8), %r9 #248.30
movq %r9, 40(%rdx,%r10,8) #248.13
cmpl %eax, %r8d #246.9
jb ..B3.25 # Prob 64% #246.9
# LOE rdx rbx r12 r14 eax ecx esi edi r8d r13d r15d
..B3.26: # Preds ..B3.25
# Execution count [1.88e+00]: Infreq
lea 1(%r8,%r8), %edx #247.13
# LOE rbx r12 r14 edx r13d r15d
..B3.27: # Preds ..B3.26 ..B3.23
# Execution count [2.09e+00]: Infreq
lea -1(%rdx), %eax #246.9
cmpl 248(%rsp), %eax #246.9[spill]
jae ..B3.29 # Prob 10% #246.9
# LOE rbx r12 r14 edx r13d r15d
..B3.28: # Preds ..B3.27
# Execution count [1.88e+00]: Infreq
imull %r15d, %edx #247.30
addl 224(%rsp), %edx #247.30[spill]
movslq %edx, %rdx #247.30
movq 216(%rsp), %rsi #248.30[spill]
movq 8(%r14,%rdx,8), %rax #247.30
movq %rax, (%r14,%rdx,8) #247.13
movq (%rsi,%rdx,8), %rcx #248.30
movq %rcx, 8(%rsi,%rdx,8) #248.13
# LOE rbx r12 r14 r13d r15d
..B3.29: # Preds ..B3.27 ..B3.44 ..B3.76 ..B3.77 ..B3.78
# ..B3.28
# Execution count [2.09e+00]: Infreq
movl $1, %edx #251.9
lea 368(%rsp), %rdi #251.9
movl $1275070475, %ecx #251.9
lea 232(%rsp), %rsi #251.9
movl $1476395011, %r8d #251.9
movl $1140850688, %r9d #251.9
vzeroupper #251.9
..___tag_value_solve.203:
# MPI_Allreduce(const void *, void *, int, MPI_Datatype, MPI_Op, MPI_Comm)
call MPI_Allreduce #251.9
..___tag_value_solve.204:
# LOE rbx r12 r14 r13d r15d
..B3.30: # Preds ..B3.29
# Execution count [2.09e+00]: Infreq
vmovsd 232(%rsp), %xmm0 #252.15
vdivsd 272(%rsp), %xmm0, %xmm1 #253.34[spill]
vsqrtsd %xmm1, %xmm1, %xmm1 #253.15
movl 280(%rsp), %esi #259.9[spill]
vcomisd 264(%rsp), %xmm1 #219.20[spill]
jae ..B3.3 # Prob 82% #219.20
# LOE rbx r12 r14 esi r13d r15d xmm1
..B3.31: # Preds ..B3.3 ..B3.30
# Execution count [3.77e-01]: Infreq
vmovsd 32(%rsp), %xmm0 #[spill]
movq 256(%rsp), %r11 #[spill]
# LOE r11 esi xmm0 xmm1
..B3.32: # Preds ..B3.31 ..B3.1
# Execution count [1.00e+00]: Infreq
cmpl $0, 36(%r11) #262.25
jne ..B3.34 # Prob 78% #262.25
# LOE esi xmm0 xmm1
..B3.33: # Preds ..B3.32
# Execution count [2.20e-01]: Infreq
movl $.L_2__STRING.6, %edi #263.9
xorl %eax, %eax #263.9
vmovsd %xmm1, 368(%rsp) #217.5
vzeroupper #263.9
vmovsd %xmm1, (%rsp) #263.9[spill]
vmovsd %xmm0, 32(%rsp) #263.9[spill]
..___tag_value_solve.211:
# printf(const char *__restrict__, ...)
call printf #263.9
..___tag_value_solve.212:
# LOE
..B3.89: # Preds ..B3.33
# Execution count [2.20e-01]: Infreq
vmovsd 32(%rsp), %xmm0 #[spill]
vmovsd (%rsp), %xmm1 #[spill]
# LOE xmm0 xmm1
..B3.34: # Preds ..B3.89 ..B3.32
# Execution count [1.00e+00]: Infreq
vcmpgtsd %xmm1, %xmm0, %xmm0 #266.16
vmovd %xmm0, %eax #266.16
negl %eax #266.16
vzeroupper #266.16
addq $408, %rsp #266.16
.cfi_restore 3
popq %rbx #266.16
.cfi_restore 15
popq %r15 #266.16
.cfi_restore 14
popq %r14 #266.16
.cfi_restore 13
popq %r13 #266.16
.cfi_restore 12
popq %r12 #266.16
movq %rbp, %rsp #266.16
popq %rbp #266.16
.cfi_def_cfa 7, 8
.cfi_restore 6
ret #266.16
.cfi_def_cfa 6, 16
.cfi_escape 0x10, 0x03, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xd8, 0xff, 0xff, 0xff, 0x22
.cfi_offset 6, -16
.cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf0, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0f, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x22
# LOE
..B3.35: # Preds ..B3.17
# Execution count [1.70e+00]: Infreq
movq 256(%rsp), %rax #234.13[spill]
vmovsd %xmm1, 328(%rsp) #[spill]
vmovsd %xmm2, 336(%rsp) #[spill]
movl 36(%rax), %ecx #234.13
vmovsd %xmm3, 344(%rsp) #[spill]
movq %rsi, 320(%rsp) #[spill]
testl %ecx, %ecx #234.29
jne ..B3.40 # Prob 50% #234.29
# LOE rax rbx r12 r14 ecx r13d r15d
..B3.36: # Preds ..B3.35 ..B3.76
# Execution count [5.23e-03]: Infreq
cmpl $12, %r13d #235.13
jle ..B3.64 # Prob 10% #235.13
# LOE rbx r12 r14 ecx r13d r15d
..B3.37: # Preds ..B3.36
# Execution count [1.05e+00]: Infreq
cmpl $0, 160(%rsp) #235.13[spill]
je ..B3.45 # Prob 10% #235.13
# LOE rbx r12 r14 ecx r13d r15d
..B3.38: # Preds ..B3.37
# Execution count [1.05e+00]: Infreq
movq 136(%rsp), %rdi #235.13[spill]
movq 120(%rsp), %rsi #235.13[spill]
movq 144(%rsp), %rdx #235.13[spill]
movl %ecx, 168(%rsp) #235.13[spill]
call __intel_skx_avx512_memcpy #235.13
# LOE rbx r12 r14 r13d r15d
..B3.88: # Preds ..B3.38
# Execution count [1.05e+00]: Infreq
movl 168(%rsp), %ecx #[spill]
# LOE rbx r12 r14 ecx r13d r15d
..B3.39: # Preds ..B3.88 ..B3.53
# Execution count [1.05e+00]: Infreq
movq 256(%rsp), %rax #240.30[spill]
movl 40(%rax), %edx #240.30
decl %edx #240.45
cmpl %edx, %ecx #240.45
je ..B3.42 # Prob 50% #240.45
jmp ..B3.44 # Prob 100% #240.45
# LOE rbx r12 r14 r13d r15d
..B3.40: # Preds ..B3.35
# Execution count [8.48e-01]: Infreq
movl 40(%rax), %edx #240.30
decl %edx #240.45
cmpl %edx, %ecx #240.45
jne ..B3.23 # Prob 50% #240.45
# LOE rbx r12 r14 r13d r15d
..B3.41: # Preds ..B3.40 ..B3.62 ..B3.78
# Execution count [0.00e+00]: Infreq
cmpl $12, %r13d #241.13
jle ..B3.66 # Prob 10% #241.13
# LOE rbx r12 r14 r13d r15d
..B3.42: # Preds ..B3.41 ..B3.39
# Execution count [1.05e+00]: Infreq
cmpl $0, 152(%rsp) #241.13[spill]
je ..B3.66 # Prob 10% #241.13
# LOE rbx r12 r14 r13d r15d
..B3.43: # Preds ..B3.42
# Execution count [1.05e+00]: Infreq
vzeroupper #241.13
movq 128(%rsp), %rdi #241.13[spill]
movq 104(%rsp), %rsi #241.13[spill]
movq 144(%rsp), %rdx #241.13[spill]
call __intel_skx_avx512_memcpy #241.13
# LOE rbx r12 r14 r13d r15d
..B3.44: # Preds ..B3.43 ..B3.70 ..B3.39 ..B3.62 ..B3.71
#
# Execution count [5.38e-01]: Infreq
cmpl $0, 248(%rsp) #246.41[spill]
jg ..B3.23 # Prob 50% #246.41
jmp ..B3.29 # Prob 100% #246.41
# LOE rbx r12 r14 r13d r15d
..B3.45: # Preds ..B3.37
# Execution count [1.99e-01]: Infreq
cmpl $30, %r13d #235.13
jl ..B3.63 # Prob 10% #235.13
# LOE rbx r12 r14 ecx r13d r15d
..B3.46: # Preds ..B3.45
# Execution count [1.05e+00]: Infreq
movl 112(%rsp), %edi #235.13[spill]
cmpl $0, 96(%rsp) #235.13[spill]
je ..B3.48 # Prob 50% #235.13
# LOE rbx r12 r14 ecx edi r13d r15d
..B3.47: # Preds ..B3.46
# Execution count [5.23e-01]: Infreq
xorl %edi, %edi #235.13
jmp ..B3.50 # Prob 100% #235.13
# LOE rbx r12 r14 ecx edi r13d r15d
..B3.48: # Preds ..B3.46
# Execution count [5.23e-01]: Infreq
cmpl $0, 112(%rsp) #235.13[spill]
je ..B3.50 # Prob 50% #235.13
# LOE rbx r12 r14 ecx edi r13d r15d
..B3.49: # Preds ..B3.48
# Execution count [5.81e+00]: Infreq
movl 296(%rsp), %edi #235.13[spill]
cmpl %edi, %r13d #235.13
cmovl %r13d, %edi #235.13
# LOE rbx r12 r14 ecx edi r13d r15d
..B3.50: # Preds ..B3.47 ..B3.49 ..B3.48
# Execution count [1.16e+00]: Infreq
movl %r13d, %esi #235.13
subl %edi, %esi #235.13
andl $7, %esi #235.13
negl %esi #235.13
addl %r13d, %esi #235.13
cmpl $1, %edi #235.13
jb ..B3.54 # Prob 50% #235.13
# LOE rbx r12 r14 ecx esi edi r13d r15d
..B3.51: # Preds ..B3.50
# Execution count [1.05e+00]: Infreq
vmovdqu .L_2il0floatpacket.7(%rip), %ymm1 #235.13
movq %r12, %rdx #235.13
vmovdqu .L_2il0floatpacket.6(%rip), %ymm3 #235.13
vpbroadcastd %edi, %ymm0 #235.13
movslq %edi, %rax #235.13
movq 320(%rsp), %r8 #235.13[spill]
# LOE rax rdx rbx r8 r12 r14 ecx esi edi r13d r15d ymm0 ymm1 ymm3
..B3.52: # Preds ..B3.52 ..B3.51
# Execution count [5.81e+00]: Infreq
vpcmpgtd %ymm1, %ymm0, %k1 #235.13
vpaddd %ymm3, %ymm1, %ymm1 #235.13
vmovupd 24(%r14,%rdx,8), %zmm2{%k1}{z} #236.27
vmovupd %zmm2, 8(%r8,%rdx,8){%k1} #236.17
addq $8, %rdx #235.13
cmpq %rax, %rdx #235.13
jb ..B3.52 # Prob 82% #235.13
# LOE rax rdx rbx r8 r12 r14 ecx esi edi r13d r15d ymm0 ymm1 ymm3
..B3.53: # Preds ..B3.52
# Execution count [1.05e+00]: Infreq
cmpl %edi, %r13d #235.13
je ..B3.39 # Prob 10% #235.13
# LOE rbx r12 r14 ecx esi edi r13d r15d
..B3.54: # Preds ..B3.53 ..B3.50 ..B3.63
# Execution count [5.81e+00]: Infreq
movslq %esi, %rax #235.13
lea 8(%rdi), %edx #235.13
cmpl %edx, %esi #235.13
jl ..B3.58 # Prob 50% #235.13
# LOE rax rbx r12 r14 ecx edi r13d r15d
..B3.55: # Preds ..B3.54
# Execution count [1.05e+00]: Infreq
movslq %edi, %rdi #235.13
movq 320(%rsp), %rdx #235.13[spill]
# LOE rax rdx rbx rdi r12 r14 ecx r13d r15d
..B3.56: # Preds ..B3.56 ..B3.55
# Execution count [5.81e+00]: Infreq
vmovups 24(%r14,%rdi,8), %zmm0 #236.27
vmovupd %zmm0, 8(%rdx,%rdi,8) #236.17
addq $8, %rdi #235.13
cmpq %rax, %rdi #235.13
jb ..B3.56 # Prob 82% #235.13
# LOE rax rdx rbx rdi r12 r14 ecx r13d r15d
..B3.58: # Preds ..B3.56 ..B3.54 ..B3.65
# Execution count [1.16e+00]: Infreq
cmpq 352(%rsp), %rax #235.13[spill]
jae ..B3.62 # Prob 10% #235.13
# LOE rax rbx r12 r14 ecx r13d r15d
..B3.59: # Preds ..B3.58
# Execution count [1.05e+00]: Infreq
movq 352(%rsp), %rsi #[spill]
movq 320(%rsp), %rdi #[spill]
# LOE rax rbx rsi rdi r12 r14 ecx r13d r15d
..B3.60: # Preds ..B3.60 ..B3.59
# Execution count [5.81e+00]: Infreq
movq 24(%r14,%rax,8), %rdx #236.27
movq %rdx, 8(%rdi,%rax,8) #236.17
incq %rax #235.13
cmpq %rsi, %rax #235.13
jb ..B3.60 # Prob 82% #235.13
# LOE rax rbx rsi rdi r12 r14 ecx r13d r15d
..B3.62: # Preds ..B3.60 ..B3.58
# Execution count [0.00e+00]: Infreq
movq 256(%rsp), %rax #240.30[spill]
movl 40(%rax), %edx #240.30
decl %edx #240.45
cmpl %edx, %ecx #240.45
je ..B3.41 # Prob 50% #240.45
jmp ..B3.44 # Prob 100% #240.45
# LOE rbx r12 r14 r13d r15d
..B3.63: # Preds ..B3.64 ..B3.45
# Execution count [1.05e-01]: Infreq
movl 40(%rsp), %esi #235.13[spill]
xorl %edi, %edi #235.13
jmp ..B3.54 # Prob 100% #235.13
# LOE rbx r12 r14 ecx esi edi r13d r15d
..B3.64: # Preds ..B3.36
# Execution count [9.42e-01]: Infreq
cmpl $8, %r13d #235.13
jge ..B3.63 # Prob 90% #235.13
# LOE rbx r12 r14 ecx r13d r15d
..B3.65: # Preds ..B3.64
# Execution count [1.05e-01]: Infreq
movq %r12, %rax #235.13
jmp ..B3.58 # Prob 100% #235.13
# LOE rax rbx r12 r14 ecx r13d r15d
..B3.66: # Preds ..B3.42 ..B3.41
# Execution count [1.16e+00]: Infreq
movl $1, %edx #241.13
xorl %r8d, %r8d #241.13
cmpl $0, 176(%rsp) #241.13[spill]
je ..B3.70 # Prob 10% #241.13
# LOE rbx r12 r14 edx r8d r13d r15d
..B3.67: # Preds ..B3.66
# Execution count [1.05e+00]: Infreq
movl 56(%rsp), %edi #[spill]
movl 48(%rsp), %esi #[spill]
movl 176(%rsp), %ecx #[spill]
movq 320(%rsp), %rdx #[spill]
# LOE rdx rbx r12 r14 ecx esi edi r8d r13d r15d
..B3.68: # Preds ..B3.68 ..B3.67
# Execution count [2.91e+00]: Infreq
lea (%rdi,%r8,2), %r9d #203.19
movslq %r9d, %r9 #242.39
lea (%rsi,%r8,2), %eax #203.19
movslq %eax, %rax #242.17
incl %r8d #241.13
movq 8(%rdx,%r9,8), %r10 #242.39
movq %r10, 24(%rdx,%rax,8) #242.17
movq 16(%rdx,%r9,8), %r11 #242.39
movq %r11, 32(%rdx,%rax,8) #242.17
cmpl %ecx, %r8d #241.13
jb ..B3.68 # Prob 64% #241.13
# LOE rdx rbx r12 r14 ecx esi edi r8d r13d r15d
..B3.69: # Preds ..B3.68
# Execution count [1.05e+00]: Infreq
lea 1(%r8,%r8), %edx #242.17
# LOE rbx r12 r14 edx r13d r15d
..B3.70: # Preds ..B3.69 ..B3.66
# Execution count [1.16e+00]: Infreq
lea -1(%rdx), %eax #241.13
cmpl %r13d, %eax #241.13
jae ..B3.44 # Prob 10% #241.13
# LOE rbx r12 r14 edx r13d r15d
..B3.71: # Preds ..B3.70
# Execution count [1.05e+00]: Infreq
movslq %edx, %rdx #242.39
movq 80(%rsp), %rax #242.39[spill]
movq 88(%rsp), %rsi #242.17[spill]
movq (%rax,%rdx,8), %rcx #242.39
movq %rcx, 16(%rsi,%rdx,8) #242.17
jmp ..B3.44 # Prob 100% #242.17
# LOE rbx r12 r14 r13d r15d
..B3.72: # Preds ..B3.13
# Execution count [1.88e-01]: Infreq
cmpq $1, %rbx #223.9
jbe ..B3.23 # Prob 18% #223.9
# LOE rbx r12 r14 r13d r15d
..B3.73: # Preds ..B3.72
# Execution count [1.54e-01]: Infreq
movl $2, %ecx #223.9
cmpq $2, %rbx #223.9
jbe ..B3.23 # Prob 18% #223.9
# LOE rcx rbx r12 r14 r13d r15d
..B3.74: # Preds ..B3.73
# Execution count [7.84e+00]: Infreq
vmovsd .L_2il0floatpacket.8(%rip), %xmm0 #
vmovsd 328(%rsp), %xmm1 #[spill]
vmovsd 336(%rsp), %xmm2 #[spill]
vmovsd 344(%rsp), %xmm3 #[spill]
movq 304(%rsp), %rdi #[spill]
movq 312(%rsp), %rdx #[spill]
movq 320(%rsp), %rsi #[spill]
jmp ..B3.19 # Prob 100% #
# LOE rdx rcx rbx rsi rdi r12 r14 r13d r15d xmm0 xmm1 xmm2 xmm3
..B3.75: # Preds ..B3.12
# Execution count [2.09e-01]: Infreq
movq 256(%rsp), %rax #234.13[spill]
movl 36(%rax), %ecx #234.13
testl %ecx, %ecx #234.29
jne ..B3.77 # Prob 50% #234.29
# LOE rax rbx r12 r14 ecx r13d r15d
..B3.76: # Preds ..B3.75
# Execution count [1.05e-01]: Infreq
testl %r13d, %r13d #235.40
jg ..B3.36 # Prob 50% #235.40
jmp ..B3.29 # Prob 100% #235.40
# LOE rbx r12 r14 ecx r13d r15d
..B3.77: # Preds ..B3.75
# Execution count [6.23e-01]: Infreq
movl 40(%rax), %edx #240.30
decl %edx #240.45
cmpl %edx, %ecx #240.45
jne ..B3.29 # Prob 50% #240.45
# LOE rbx r12 r14 r13d r15d
..B3.78: # Preds ..B3.77
# Execution count [3.11e-01]: Infreq
testl %r13d, %r13d #241.40
jg ..B3.41 # Prob 50% #241.40
jmp ..B3.29 # Prob 100% #241.40
.align 16,0x90
# LOE rbx r12 r14 r13d r15d
.cfi_endproc
# mark_end;
.type solve,@function
.size solve,.-solve
..LNsolve.2:
.data
# -- End solve
.text
.L_2__routine_start_solveRB_3:
# -- Begin solveRB
.text
# mark_begin;
.align 16,0x90
.globl solveRB
# --- solveRB(Solver *)
#-----------------------------------------------------------------------
# solveRB(Solver *) -- compiler-generated code (AT&T operand order: src, dst).
#
# In:   rdi = pointer to the Solver object.
# Out:  eax = 1 if the double at Solver+64 is greater than the final
#             residual value, otherwise 0 (see ..B4.40).
#
# Solver field names are not visible in this file, so fields are named by
# byte offset. Shorthand used in the comments below:
#   n   = int at Solver+24  (points per row; row stride is n+2 doubles)
#   m   = int at Solver+32  (number of rows swept by the outer loop)
#   p   = pointer at Solver+48 (array that is read and updated in place)
#   rhs = pointer at Solver+56 (array that is only read)
#   +36 / +40 are used as "my index" / "count" when choosing MPI peers
#   -- presumably rank and size; confirm against the Solver declaration.
#
# Shape of the routine, as established by the blocks below:
#   repeat (at most [Solver+88] times, while residual >= [Solver+64]^2):
#       residual accumulator = 0
#       two sweeps; each sweep exchanges boundary rows with the
#       neighbouring peers (Isend/Irecv/Waitall) and then updates every
#       second point of each row, the start column alternating 1,2,1,...
#       copy rows 1 and m into rows 0 and m+1, columns 1 and n into
#       columns 0 and n+1
#       MPI_Allreduce of the accumulator, divided by ([+24] * [+28])
#   print once (only where [Solver+36] == 0) and return the flag.
#
# Frame: 4 pushes + 280 bytes of locals (CFA = rsp + 320 in the body).
# r12 and r13 are saved to frame slots 8(%rsp)/16(%rsp), not pushed.
#-----------------------------------------------------------------------
solveRB:
# parameter 1: %rdi
..B4.1: # Preds ..B4.0
# Execution count [1.00e+00]
.cfi_startproc
..___tag_value_solveRB.273:
..L274:
#273.1
pushq %r14 #273.1
.cfi_def_cfa_offset 16
.cfi_offset 14, -16
pushq %r15 #273.1
.cfi_def_cfa_offset 24
.cfi_offset 15, -24
pushq %rbx #273.1
.cfi_def_cfa_offset 32
.cfi_offset 3, -32
pushq %rbp #273.1
.cfi_def_cfa_offset 40
.cfi_offset 6, -40
subq $280, %rsp #273.1
.cfi_def_cfa_offset 320
# r10 = Solver*. The scalar block below derives the loop constants:
#   xmm11 = c9 / [+0]^2          xmm10 = c9 / [+8]^2
#   xmm5  = c5 * [+72] * [+0]^2 * [+8]^2 / ([+0]^2 + [+8]^2)
#   xmm4  = [+64]^2  (convergence threshold)
#   xmm1  = [+64] + c9  (initial residual, so the loop is normally entered)
# where c5 = .L_2il0floatpacket.5 and c9 = .L_2il0floatpacket.9; their
# values are defined elsewhere in the file (c9 is presumably 1.0 -- confirm).
movq %rdi, %r10 #273.1
vmovsd .L_2il0floatpacket.5(%rip), %xmm2 #289.29
# esi = 0: iteration count reported by printf if the loop is skipped.
xorl %esi, %esi #275.12
vmovsd .L_2il0floatpacket.9(%rip), %xmm9 #287.27
vmovsd (%r10), %xmm6 #285.21
vmulsd %xmm6, %xmm6, %xmm4 #285.34
vmulsd 72(%r10), %xmm2, %xmm3 #289.29
vdivsd %xmm4, %xmm9, %xmm11 #287.27
vmovsd 8(%r10), %xmm1 #286.21
vmulsd %xmm1, %xmm1, %xmm8 #286.34
vmulsd %xmm4, %xmm3, %xmm5 #289.42
vdivsd %xmm8, %xmm9, %xmm10 #288.27
vmovsd 64(%r10), %xmm0 #281.21
vmulsd %xmm0, %xmm0, %xmm4 #293.26
vaddsd %xmm9, %xmm0, %xmm1 #295.17
vmulsd %xmm8, %xmm5, %xmm7 #289.42
# xmm8 = xmm6*xmm6 + xmm8 = [+0]^2 + [+8]^2 (231 form: dst += src2*src3).
vfmadd231sd %xmm6, %xmm6, %xmm8 #289.56
# Flags from this compare are consumed by the jb at the end of the block;
# the vdivsd and mov instructions in between do not modify EFLAGS.
vcomisd %xmm4, %xmm1 #297.20
vdivsd %xmm8, %xmm7, %xmm5 #289.56
movl 24(%r10), %ecx #278.21
movl 28(%r10), %eax #279.21
movl 32(%r10), %r15d #280.21
movl 88(%r10), %r9d #283.21
movq 48(%r10), %r8 #290.21
movq 56(%r10), %rdi #291.21
# Skip the whole iteration loop when initial residual < threshold
# (jb is also taken on an unordered compare, i.e. when a NaN is involved).
jb ..B4.38 # Prob 10% #297.20
# LOE rdi r8 r10 r12 r13 eax ecx esi r9d r15d xmm0 xmm1 xmm4 xmm5 xmm10 xmm11
..B4.2: # Preds ..B4.1
# Execution count [9.00e-01]
# Loop pre-header: precompute index/pointer invariants and spill them.
# Frame slots written here (offsets from rsp):
#     8,16  saved r12, r13              24  [+64]
#    40     3n                          48  2n+4 (two row strides)
#    56     n*m + 2m                    64  n*m + 2m + n
#    72     p + 8*(n*m+2m)              80  p + 8*(n*m+2m+n)
#    88     n+2 (row stride)            96  p + 16n bytes
#   104     -n                         160  n >> 1
#   168     (double)([+24]*[+28])      176  [+64]^2
#   184     [+88] (iteration limit)    200  rhs
#   208     Solver*                    216  c9/[+0]^2
#   224     c9/[+8]^2                  232  update factor (xmm5)
#   240     p
# Registers on exit: r12d = n, rbp = p + 8n, ebx = m >> 1, r14d = 0
# (iteration counter), r13 = 0, r15d = m.
imull %ecx, %eax #331.37
# Zero xmm3 first so the int->double convert below has no false dependency.
vxorpd %xmm3, %xmm3, %xmm3 #331.37
vmovsd .L_2il0floatpacket.8(%rip), %xmm2 #309.48
vmovsd %xmm4, 176(%rsp) #322.35[spill]
vmovsd %xmm5, 232(%rsp) #322.35[spill]
vmovsd %xmm10, 224(%rsp) #322.35[spill]
movslq %ecx, %rcx #321.35
movl %r15d, %ebx #325.9
movl %ecx, %edx #326.30
lea 2(%rcx), %r11d #310.67
negl %edx #326.30
xorl %r14d, %r14d #297.5
movl %edx, 104(%rsp) #326.30[spill]
lea 4(%rcx,%rcx), %edx #310.67
movl %edx, 48(%rsp) #310.67[spill]
movl %ecx, %edx #280.19
imull %r15d, %edx #280.19
lea (,%rcx,8), %rbp #321.35
vmovsd %xmm11, 216(%rsp) #322.35[spill]
vmovsd %xmm0, 24(%rsp) #322.35[spill]
vcvtsi2sd %eax, %xmm3, %xmm3 #331.37
movl %r11d, 88(%rsp) #310.67[spill]
lea (%rbp,%rcx,8), %rax #327.30
addq %r8, %rax #327.30
lea (%rcx,%rdx), %r11d #322.13
movq %rax, 96(%rsp) #327.30[spill]
lea (%rcx,%rcx,2), %eax #327.30
movl %eax, 40(%rsp) #327.30[spill]
movl %ecx, %eax #320.9
shrl $1, %eax #320.9
lea (%rdx,%r15,2), %edx #322.35
movl %eax, 160(%rsp) #320.9[spill]
lea (%r11,%r15,2), %eax #280.19
movslq %eax, %rax #322.13
lea (%r8,%rcx,8), %rbp #321.35
movslq %edx, %rdx #322.35
shrl $1, %ebx #325.9
vmovsd %xmm3, 168(%rsp) #322.35[spill]
movl %edx, 56(%rsp) #322.35[spill]
lea (%r8,%rax,8), %r11 #322.13
movq %r11, 80(%rsp) #322.13[spill]
lea (%r8,%rdx,8), %r11 #322.35
movq %r11, 72(%rsp) #322.35[spill]
movl %eax, 64(%rsp) #322.35[spill]
movq %rdi, 200(%rsp) #322.35[spill]
movq %r8, 240(%rsp) #322.35[spill]
movl %r9d, 184(%rsp) #322.35[spill]
movq %r10, 208(%rsp) #322.35[spill]
# r12/r13 are callee-saved; they are preserved in the frame (CFA-312 and
# CFA-304 are 8(%rsp) and 16(%rsp)) and restored in ..B4.37.
movq %r12, 8(%rsp) #322.35[spill]
.cfi_offset 12, -312
movl %ecx, %r12d #322.35
movq %r13, 16(%rsp) #322.35[spill]
.cfi_offset 13, -304
xorl %r13d, %r13d #322.35
# LOE rbp r13 ebx esi r12d r14d r15d xmm1
..B4.3: # Preds ..B4.36 ..B4.2
# Execution count [2.62e+00]
# Top of the iteration loop: r14d = ++it; leave when the previous count
# (it - 1) has reached the limit stored at 184(%rsp). Signed compare.
incl %r14d #297.5
lea -1(%r14), %eax #330.9
cmpl 184(%rsp), %eax #297.36[spill]
jge ..B4.37 # Prob 20% #297.36
# LOE rbp r13 ebx esi r12d r14d r15d xmm1
..B4.4: # Preds ..B4.3
# Execution count [2.09e+00]
# Per-iteration setup: residual accumulator 264(%rsp) = 0 (r13 is zero
# here, and all-zero bits are +0.0), sweep counter 192(%rsp) = 0.
# rbp/ebx/r14d/r12d are parked in 112/120/128/248(%rsp) because the sweep
# code reuses those registers; r12d becomes the first start column (1) and
# r13 the Solver pointer.
movl $1, %eax #299.9
xorl %esi, %esi #301.9
movq %r13, 264(%rsp) #298.9
movl %esi, 192(%rsp) #303.13[spill]
movq %rbp, 112(%rsp) #303.13[spill]
movl %ebx, 120(%rsp) #303.13[spill]
movl %r14d, 128(%rsp) #303.13[spill]
movl %r12d, 248(%rsp) #303.13[spill]
movl %eax, %r12d #303.13
movq 208(%rsp), %r13 #303.13[spill]
# LOE r13 r12d r15d
..B4.5: # Preds ..B4.41 ..B4.20 ..B4.4
# Execution count [4.19e+00]
# Start of one sweep. The four MPI_Request slots at 136..148(%rsp) are
# preset to 738197504 (0x2C000000; presumably MPI_REQUEST_NULL in this MPI
# implementation -- confirm against mpi.h) so that the MPI_Waitall in
# ..B4.12 can be given all four even when a neighbour exchange is skipped.
# ebx = start column for the first row of this sweep (copy of r12d).
# The "upper" exchange is skipped when [+36] + 1 >= [+40].
movl 36(%r13), %r14d #303.13
movl $738197504, %edx #303.13
movl %edx, 136(%rsp) #303.13
movl %r12d, %ebx #302.13
movl %edx, 140(%rsp) #303.13
movl %edx, 144(%rsp) #303.13
lea 1(%r14), %ebp #303.13
movl %edx, 148(%rsp) #303.13
cmpl 40(%r13), %ebp #303.13
jge ..B4.9 # Prob 78% #303.13
# LOE r13 ebx ebp r12d r14d r15d
..B4.6: # Preds ..B4.5
# Execution count [9.21e-01]
# MPI_Isend(buf = &p[(n+2)*m + 1], count = n, type = 1275070475,
#           dest = [+36]+1, tag = 1, comm = 1140850688, &request[0]).
# rsp is lowered by 16 for the 7th (stack) argument, so every frame offset
# is +16 until the matching addq: 152(%rsp) here is request[0] (slot 136),
# and 16(%rsp)/48(%rsp) are scratch slots 0/32 holding n+2 and p.
# 1275070475 = 0x4C00080B and 1140850688 = 0x44000000; presumably MPI_DOUBLE
# and MPI_COMM_WORLD in this MPI implementation -- confirm against mpi.h.
movl 24(%r13), %esi #303.13
addq $-16, %rsp #303.13
.cfi_def_cfa_offset 336
movq 48(%r13), %rax #303.13
lea 152(%rsp), %r14 #303.13
movl $1275070475, %edx #303.13
movl %ebp, %ecx #303.13
movl $1, %r8d #303.13
lea 2(%rsi), %r10d #303.13
movq %r14, (%rsp) #303.13
movl $1140850688, %r9d #303.13
movl 32(%r13), %r14d #303.13
movl %r10d, 16(%rsp) #303.13[spill]
imull %r14d, %r10d #303.13
movslq %r10d, %r10 #303.13
movq %rax, 48(%rsp) #303.13[spill]
lea 8(%rax,%r10,8), %rdi #303.13
..___tag_value_solveRB.318:
# MPI_Isend(const void *, int, MPI_Datatype, int, int, MPI_Comm, MPI_Request *)
call MPI_Isend #303.13
..___tag_value_solveRB.319:
# LOE r13 ebx ebp r12d r14d r15d
..B4.46: # Preds ..B4.6
# Execution count [9.21e-01]
# rax is caller-saved, so p is reloaded from its spill slot after the call.
movq 48(%rsp), %rax #[spill]
# LOE rax r13 ebx ebp r12d r14d r15d
..B4.7: # Preds ..B4.46
# Execution count [9.21e-01]
# MPI_Irecv(buf = &p[(n+2)*(m+1) + 1], count = n, same type,
#           source = [+36]+1, tag = 2, same comm, &request[1]).
# r14d still holds m and ebp the peer index (both callee-saved).
incl %r14d #303.13
imull 16(%rsp), %r14d #303.13[spill]
movl $1275070475, %edx #303.13
movslq %r14d, %r14 #303.13
movl %ebp, %ecx #303.13
movl $2, %r8d #303.13
movl $1140850688, %r9d #303.13
movl 24(%r13), %esi #303.13
lea 156(%rsp), %r10 #303.13
movq %r10, (%rsp) #303.13
lea 8(%rax,%r14,8), %rdi #303.13
..___tag_value_solveRB.322:
# MPI_Irecv(void *, int, MPI_Datatype, int, int, MPI_Comm, MPI_Request *)
call MPI_Irecv #303.13
..___tag_value_solveRB.323:
# LOE r13 ebx r12d r15d
..B4.47: # Preds ..B4.7
# Execution count [9.21e-01]
# Release the outgoing-argument area; frame offsets are back to normal.
addq $16, %rsp #303.13
.cfi_def_cfa_offset 320
# LOE r13 ebx r12d r15d
..B4.8: # Preds ..B4.47
# Execution count [9.21e-01]
# r14d was reused above, so the [+36] value is reloaded for the next test.
movl 36(%r13), %r14d #303.13
# LOE r13 ebx r12d r14d r15d
..B4.9: # Preds ..B4.8 ..B4.5
# Execution count [4.19e+00]
# The "lower" exchange is skipped when [+36] <= 0.
testl %r14d, %r14d #303.13
jle ..B4.12 # Prob 40% #303.13
# LOE r13 ebx r12d r14d r15d
..B4.10: # Preds ..B4.9
# Execution count [2.50e+00]
# MPI_Isend(buf = &p[(n+2) + 1], count = n, dest = [+36]-1, tag = 2,
#           &request[2]); rsp is lowered by 16 again, so 160(%rsp) is
# frame slot 144. rbp = p is kept for the receive that follows.
addq $-16, %rsp #303.13
.cfi_def_cfa_offset 336
decl %r14d #303.13
movslq 24(%r13), %r10 #303.13
lea 160(%rsp), %rbp #303.13
movl $1275070475, %edx #303.13
movl %r14d, %ecx #303.13
movl $2, %r8d #303.13
movl $1140850688, %r9d #303.13
movq %rbp, (%rsp) #303.13
movq 48(%r13), %rbp #303.13
movl 24(%r13), %esi #303.13
lea 24(%rbp,%r10,8), %rdi #303.13
..___tag_value_solveRB.326:
# MPI_Isend(const void *, int, MPI_Datatype, int, int, MPI_Comm, MPI_Request *)
call MPI_Isend #303.13
..___tag_value_solveRB.327:
# LOE rbp r13 ebx r12d r14d r15d
..B4.11: # Preds ..B4.10
# Execution count [2.50e+00]
# MPI_Irecv(buf = &p[1], count = n, source = [+36]-1, tag = 1,
#           &request[3]) -- 164(%rsp) is frame slot 148.
addq $8, %rbp #303.13
movq %rbp, %rdi #303.13
movl $1275070475, %edx #303.13
movl %r14d, %ecx #303.13
movl $1, %r8d #303.13
movl $1140850688, %r9d #303.13
lea 164(%rsp), %r10 #303.13
movl 24(%r13), %esi #303.13
movq %r10, (%rsp) #303.13
..___tag_value_solveRB.328:
# MPI_Irecv(void *, int, MPI_Datatype, int, int, MPI_Comm, MPI_Request *)
call MPI_Irecv #303.13
..___tag_value_solveRB.329:
# LOE r13 ebx r12d r15d
..B4.49: # Preds ..B4.11
# Execution count [2.50e+00]
addq $16, %rsp #303.13
.cfi_def_cfa_offset 320
# LOE r13 ebx r12d r15d
..B4.12: # Preds ..B4.49 ..B4.9
# Execution count [4.19e+00]
# MPI_Waitall(4, &request[0], (MPI_Status *)1). The literal 1 is
# presumably this implementation's MPI_STATUSES_IGNORE -- confirm.
movl $4, %edi #303.13
lea 136(%rsp), %rsi #303.13
movl $1, %edx #303.13
..___tag_value_solveRB.331:
# MPI_Waitall(int, MPI_Request *, MPI_Status *)
call MPI_Waitall #303.13
..___tag_value_solveRB.332:
# LOE r13 ebx r12d r15d
..B4.13: # Preds ..B4.12
# Execution count [4.19e+00]
# Row loop setup: edx = row counter, eax = element offset of the current
# row (advanced by n+2 per row). No rows to sweep when m <= 0.
xorl %edx, %edx #305.13
xorl %eax, %eax #306.30
testl %r15d, %r15d #305.45
jle ..B4.41 # Prob 10% #305.45
# LOE r13 eax edx ebx r12d r15d
..B4.14: # Preds ..B4.13
# Execution count [3.77e+00]
# Load the sweep invariants into registers:
#   xmm0 = .L_2il0floatpacket.8 (multiplies the centre value in the
#          stencil; presumably 2.0 -- confirm at its definition)
#   xmm1 = update factor, xmm2 = c9/[+8]^2, xmm3 = c9/[+0]^2
#   r8 = rhs, rdi = p, r9d = n
# r12d (sweep start column) and r13 (Solver*) are spilled because the inner
# loop uses r12/r13 as address temporaries.
movl %r12d, 256(%rsp) #[spill]
movq %r13, 208(%rsp) #[spill]
vmovsd .L_2il0floatpacket.8(%rip), %xmm0 #
vmovsd 232(%rsp), %xmm1 #[spill]
vmovsd 224(%rsp), %xmm2 #[spill]
vmovsd 216(%rsp), %xmm3 #[spill]
movq 200(%rsp), %r8 #[spill]
movq 240(%rsp), %rdi #[spill]
movl 248(%rsp), %r9d #[spill]
# LOE rdi r8 eax edx ebx r9d r15d xmm0 xmm1 xmm2 xmm3
..B4.15: # Preds ..B4.19 ..B4.14
# Execution count [2.09e+01]
# One row: r10d = point counter k. Skip the row if the start column
# ebx is already greater than n (signed compare).
xorl %r10d, %r10d #306.17
cmpl %r9d, %ebx #306.46
jg ..B4.19 # Prob 10% #306.46
# LOE rdi r8 eax edx ebx r9d r10d r15d xmm0 xmm1 xmm2 xmm3
..B4.16: # Preds ..B4.15
# Execution count [1.88e+01]
# ebp = (n - start + 2) >> 1 = number of points visited in this row.
# r13 = &p[start], rsi = &rhs[start]; r11d = rowoff + n and
# r12d = rowoff + 2n are the bases for the current and next row.
movslq %ebx, %rbx #308.32
movl %r9d, %ebp #278.21
subl %ebx, %ebp #278.21
lea (%r9,%rax), %r11d #308.32
addl $2, %ebp #278.21
lea (%rax,%r9,2), %r12d #310.37
shrl $1, %ebp #278.21
lea (%rdi,%rbx,8), %r13 #309.34
lea (%r8,%rbx,8), %rsi #308.32
.align 16,0x90
# LOE rsi rdi r8 r13 eax edx ebx ebp r9d r10d r11d r12d r15d xmm0 xmm1 xmm2 xmm3
..B4.17: # Preds ..B4.17 ..B4.16
# Execution count [1.05e+02]
# Inner loop: one point per trip, column i = start + 2k of row j, where
# rowoff = (j-1)*(n+2). Addresses (in doubles, relative to p):
#   16(%r13,%rcx,8) -> p[j*(n+2) + i]       centre  (xmm10)
#   24(%r13,%rcx,8) -> p[j*(n+2) + i + 1]   (xmm4)
#    8(%r13,%rcx,8) -> p[j*(n+2) + i - 1]
#   32(%r13,%r14,8) -> p[(j+1)*(n+2) + i]   (xmm6)
#     (%r13,%r14,8) -> p[(j-1)*(n+2) + i]   (r14 recomputed in between)
# Computation:
#   xmm7  = xmm0 * centre
#   xmm12 = rhs[j*(n+2)+i] - xmm3*(p[i+1] - xmm7 + p[i-1])
#                          - xmm2*(p[j+1] - xmm7 + p[j-1])
#   centre -= xmm1 * xmm12            (stored back in place)
#   264(%rsp) += xmm12 * xmm12        (residual accumulator, kept in memory)
# FMA forms in AT&T order "op src3, src2, dst":
#   vfnmadd213sd: dst = -(src2*dst) + src3
#   vfnmadd231sd: dst = -(src2*src3) + dst
#   vfmadd213sd:  dst =  (src2*dst) + src3
lea (%r11,%r10,2), %ecx #310.57
movslq %ecx, %rcx #308.32
lea (%r12,%r10,2), %r14d #310.37
movslq %r14d, %r14 #310.37
vmovsd 16(%r13,%rcx,8), %xmm10 #310.57
vmulsd %xmm10, %xmm0, %xmm7 #310.57
vmovsd 24(%r13,%rcx,8), %xmm4 #309.34
vmovsd 32(%r13,%r14,8), %xmm6 #310.37
lea (%rax,%r10,2), %r14d #310.67
movslq %r14d, %r14 #310.67
incl %r10d #306.17
vsubsd %xmm7, %xmm4, %xmm5 #309.54
vsubsd %xmm7, %xmm6, %xmm8 #310.57
vaddsd 8(%r13,%rcx,8), %xmm5, %xmm12 #309.64
vaddsd (%r13,%r14,8), %xmm8, %xmm9 #310.67
vfnmadd213sd 16(%rsi,%rcx,8), %xmm3, %xmm12 #310.82
vfnmadd231sd %xmm2, %xmm9, %xmm12 #310.82
vfnmadd231sd %xmm1, %xmm12, %xmm10 #312.21
vmovsd %xmm10, 16(%r13,%rcx,8) #312.21
vmovsd 264(%rsp), %xmm11 #313.21
vfmadd213sd %xmm11, %xmm12, %xmm12 #313.21
vmovsd %xmm12, 264(%rsp) #313.21
cmpl %ebp, %r10d #306.17
jb ..B4.17 # Prob 82% #306.17
# LOE rsi rdi r8 r13 eax edx ebx ebp r9d r10d r11d r12d r15d xmm0 xmm1 xmm2 xmm3
..B4.19: # Preds ..B4.17 ..B4.15
# Execution count [2.09e+01]
# End of row: start column becomes 3 - start (toggles 1 <-> 2), the row
# offset advances by n+2, and the loop repeats while row counter < m
# (unsigned compare; m > 0 was established in ..B4.13).
negl %ebx #315.27
incl %edx #305.13
addl $3, %ebx #315.27
lea 2(%rax,%r9), %eax #305.13
cmpl %r15d, %edx #305.13
jb ..B4.15 # Prob 82% #305.13
# LOE rdi r8 eax edx ebx r9d r15d xmm0 xmm1 xmm2 xmm3
..B4.20: # Preds ..B4.19
# Execution count [3.77e+00]
# End of sweep: the sweep's start column becomes 3 - previous, the sweep
# counter at 192(%rsp) is incremented, and a second sweep (including a
# fresh neighbour exchange) runs while the counter is below 2.
movl 256(%rsp), %r12d #[spill]
movl 192(%rsp), %edx #301.9[spill]
negl %r12d #317.23
incl %edx #301.9
addl $3, %r12d #317.23
movq 208(%rsp), %r13 #[spill]
movl %edx, 192(%rsp) #301.9[spill]
cmpl $2, %edx #301.9
jb ..B4.5 # Prob 50% #301.9
# LOE r13 r12d r15d
..B4.21: # Preds ..B4.20
# Execution count [1.88e+00]
# Both sweeps done: restore r12d = n, rbp = p + 8n, ebx = m >> 1,
# r14d = iteration counter, and re-zero r13 for the next ..B4.4.
# With n <= 0 the row-0 / row-(m+1) copy is skipped.
movl 248(%rsp), %r12d #[spill]
movq 112(%rsp), %rbp #[spill]
movl 120(%rsp), %ebx #[spill]
movl 128(%rsp), %r14d #[spill]
movq %r13, 208(%rsp) #[spill]
xorl %r13d, %r13d #
testl %r12d, %r12d #320.36
jle ..B4.29 # Prob 50% #320.36
# LOE rbp r13 ebx r12d r14d r15d
..B4.22: # Preds ..B4.21 ..B4.42
# Execution count [2.09e+00]
# Copy of the first/last rows, two columns per trip. 160(%rsp) = n >> 1
# is the pair count; edx = 1 is the column handled by the remainder step
# when there are no pairs at all.
movl $1, %edx #320.9
xorl %esi, %esi #320.9
cmpl $0, 160(%rsp) #320.9[spill]
je ..B4.26 # Prob 10% #320.9
# LOE rbp r13 edx ebx esi r12d r14d r15d
..B4.23: # Preds ..B4.22
# Execution count [1.88e+00]
# r9d = n*m + 2m, r8d = n*m + 2m + n, edi = pair count, rcx = p.
movl 56(%rsp), %r9d #[spill]
movl 64(%rsp), %r8d #[spill]
movl 160(%rsp), %edi #[spill]
movq 240(%rsp), %rcx #[spill]
.align 16,0x90
# LOE rcx rbp r13 ebx esi edi r8d r9d r12d r14d r15d
..B4.24: # Preds ..B4.24 ..B4.23
# Execution count [5.23e+00]
# For pair k (columns i = 2k+1 and i+1), with rbp = p + 8n:
#   p[i]               = p[(n+2) + i]       row 1 -> row 0
#   p[(m+1)*(n+2) + i] = p[m*(n+2) + i]     row m -> row m+1
# and the same two copies for column i+1.
movslq %esi, %r10 #321.35
lea (%r9,%rsi,2), %eax #280.19
shlq $4, %r10 #321.35
lea (%r8,%rsi,2), %edx #280.19
movslq %eax, %rax #322.35
incl %esi #320.9
movslq %edx, %rdx #322.13
movq 24(%rbp,%r10), %r11 #321.35
movq %r11, 8(%rcx,%r10) #321.13
movq 8(%rcx,%rax,8), %r11 #322.35
movq %r11, 24(%rcx,%rdx,8) #322.13
movq 32(%rbp,%r10), %r11 #321.35
movq %r11, 16(%rcx,%r10) #321.13
movq 16(%rcx,%rax,8), %r10 #322.35
movq %r10, 32(%rcx,%rdx,8) #322.13
cmpl %edi, %esi #320.9
jb ..B4.24 # Prob 64% #320.9
# LOE rcx rbp r13 ebx esi edi r8d r9d r12d r14d r15d
..B4.25: # Preds ..B4.24
# Execution count [1.88e+00]
# edx = 2*pairs + 1 = first column not yet copied.
lea 1(%rsi,%rsi), %edx #321.13
# LOE rbp r13 edx ebx r12d r14d r15d
..B4.26: # Preds ..B4.25 ..B4.22
# Execution count [2.09e+00]
# Remainder: one column is left only when edx - 1 < n (n is odd).
lea -1(%rdx), %eax #320.9
cmpl %r12d, %eax #320.9
jae ..B4.28 # Prob 10% #320.9
# LOE rbp r13 edx ebx r12d r14d r15d
..B4.27: # Preds ..B4.26
# Execution count [1.88e+00]
# Same two copies as in ..B4.24 for the single remaining column i = edx,
# using the precomputed bases in 72(%rsp) and 80(%rsp).
movslq %edx, %rdx #321.35
movq 240(%rsp), %rsi #321.13[spill]
movq 72(%rsp), %rdi #322.35[spill]
movq 80(%rsp), %r9 #322.13[spill]
movq 16(%rbp,%rdx,8), %rax #321.35
movq %rax, (%rsi,%rdx,8) #321.13
movq (%rdi,%rdx,8), %r8 #322.35
movq %r8, 16(%r9,%rdx,8) #322.13
# LOE rbp r13 ebx r12d r14d r15d
..B4.28: # Preds ..B4.26 ..B4.27
# Execution count [1.05e+00]
# With m <= 0 the column copy is skipped.
testl %r15d, %r15d #325.41
jle ..B4.35 # Prob 50% #325.41
# LOE rbp r13 ebx r12d r14d r15d
..B4.29: # Preds ..B4.21 ..B4.28
# Execution count [2.09e+00]
# Copy of the first/last columns, two rows per trip. ebx = m >> 1 is the
# pair count, edi the pair counter, edx the running row offset; esi = 1 is
# the row handled by the remainder step when there are no pairs.
xorl %edi, %edi #325.9
movl $1, %esi #325.9
xorl %edx, %edx #326.13
testl %ebx, %ebx #325.9
je ..B4.33 # Prob 10% #325.9
# LOE rbp r13 edx ebx esi edi r12d r14d r15d
..B4.30: # Preds ..B4.29
# Execution count [1.88e+00]
# esi = 2n+4 (two row strides), ecx = 3n, rax = p.
movl 48(%rsp), %esi #[spill]
movl 40(%rsp), %ecx #[spill]
movq 240(%rsp), %rax #[spill]
.align 16,0x90
# LOE rax rbp r13 edx ecx ebx esi edi r12d r14d r15d
..B4.31: # Preds ..B4.31 ..B4.30
# Execution count [5.23e+00]
# For the row pair (j, j+1), where edx = (j-1)*(n+2):
#   p[j*(n+2)]         = p[j*(n+2) + 1]     column 1 -> column 0
#   p[j*(n+2) + n + 1] = p[j*(n+2) + n]     column n -> column n+1
# and the same two copies for row j+1; edx then advances by 2n+4.
movl %edx, %r8d #326.30
lea (%rdx,%r12,2), %r11d #327.30
subl %r12d, %r8d #326.30
incl %edi #325.9
movslq %r11d, %r11 #327.30
lea (%r8,%r12,2), %r9d #326.30
movslq %r9d, %r9 #326.30
movq 24(%rax,%r9,8), %r10 #326.30
movq %r10, 16(%rax,%r9,8) #326.13
lea (%rcx,%rdx), %r10d #310.67
movq 16(%rax,%r11,8), %r8 #327.30
addl %esi, %edx #325.9
movslq %r10d, %r10 #327.30
movq %r8, 24(%rax,%r11,8) #327.13
movq 40(%rax,%r11,8), %r9 #326.30
movq %r9, 32(%rax,%r11,8) #326.13
movq 32(%rax,%r10,8), %r8 #327.30
movq %r8, 40(%rax,%r10,8) #327.13
cmpl %ebx, %edi #325.9
jb ..B4.31 # Prob 64% #325.9
# LOE rax rbp r13 edx ecx ebx esi edi r12d r14d r15d
..B4.32: # Preds ..B4.31
# Execution count [1.88e+00]
# esi = 2*pairs + 1 = first row not yet copied.
lea 1(%rdi,%rdi), %esi #326.13
# LOE rbp r13 ebx esi r12d r14d r15d
..B4.33: # Preds ..B4.32 ..B4.29
# Execution count [2.09e+00]
# Remainder: one row is left only when esi - 1 < m (m is odd).
lea -1(%rsi), %eax #325.9
cmpl %r15d, %eax #325.9
jae ..B4.35 # Prob 10% #325.9
# LOE rbp r13 ebx esi r12d r14d r15d
..B4.34: # Preds ..B4.33
# Execution count [1.88e+00]
# Last row j = esi: esi becomes j*(n+2) - n; with rbp = p + 8n and
# 96(%rsp) = p + 16n this performs the same two column copies as above.
imull 88(%rsp), %esi #326.30[spill]
addl 104(%rsp), %esi #326.30[spill]
movslq %esi, %rsi #326.30
movq 96(%rsp), %rdi #327.30[spill]
movq 8(%rbp,%rsi,8), %rax #326.30
movq %rax, (%rbp,%rsi,8) #326.13
movq (%rdi,%rsi,8), %rdx #327.30
movq %rdx, 8(%rdi,%rsi,8) #327.13
# LOE rbp r13 ebx r12d r14d r15d
..B4.35: # Preds ..B4.33 ..B4.28 ..B4.42 ..B4.34
# Execution count [2.09e+00]
# MPI_Allreduce(send = &264(%rsp) (local accumulator),
#               recv = &152(%rsp), count = 1, type = 1275070475,
#               op = 1476395011, comm = 1140850688).
# 1476395011 = 0x58000003; presumably MPI_SUM in this MPI implementation
# -- confirm against mpi.h. Slot 152 is free for reuse here because all
# requests were completed by MPI_Waitall.
movl $1, %edx #329.9
lea 264(%rsp), %rdi #329.9
movl $1275070475, %ecx #329.9
lea 152(%rsp), %rsi #329.9
movl $1476395011, %r8d #329.9
movl $1140850688, %r9d #329.9
..___tag_value_solveRB.364:
# MPI_Allreduce(const void *, void *, int, MPI_Datatype, MPI_Op, MPI_Comm)
call MPI_Allreduce #329.9
..___tag_value_solveRB.365:
# LOE rbp r13 ebx r12d r14d r15d
..B4.36: # Preds ..B4.35
# Execution count [2.09e+00]
# xmm1 = reduced value / (double)([+24]*[+28]); esi = iteration count.
# Iterate again while xmm1 >= [+64]^2 (jae is not taken on an unordered
# compare, so a NaN residual leaves the loop).
vmovsd 152(%rsp), %xmm0 #330.15
movl %r14d, %esi #335.9
vdivsd 168(%rsp), %xmm0, %xmm1 #331.37[spill]
vcomisd 176(%rsp), %xmm1 #297.20[spill]
jae ..B4.3 # Prob 82% #297.20
# LOE rbp r13 ebx esi r12d r14d r15d xmm1
..B4.37: # Preds ..B4.3 ..B4.36
# Execution count [3.77e-01]
# Loop exit: reload [+64] into xmm0 and the Solver pointer into r10, and
# restore the callee-saved r12/r13 from their frame slots.
vmovsd 24(%rsp), %xmm0 #[spill]
movq 208(%rsp), %r10 #[spill]
movq 8(%rsp), %r12 #[spill]
.cfi_restore 12
movq 16(%rsp), %r13 #[spill]
.cfi_restore 13
# LOE r10 r12 r13 esi xmm0 xmm1
..B4.38: # Preds ..B4.37 ..B4.1
# Execution count [1.00e+00]
# Only the caller whose [+36] is 0 prints.
cmpl $0, 36(%r10) #338.25
jne ..B4.40 # Prob 78% #338.25
# LOE r12 r13 esi xmm0 xmm1
..B4.39: # Preds ..B4.38
# Execution count [2.20e-01]
# printf(.L_2__STRING.6, esi): eax = 0 tells the variadic callee that no
# vector registers carry arguments. xmm0/xmm1 are caller-saved, so they
# are spilled to 24(%rsp)/(%rsp) around the call.
# NOTE(review): the format string is addressed with a 32-bit absolute
# immediate, so this object is not position-independent as generated.
movl $.L_2__STRING.6, %edi #339.9
xorl %eax, %eax #339.9
vmovsd %xmm1, 264(%rsp) #295.5
vmovsd %xmm1, (%rsp) #339.9[spill]
vmovsd %xmm0, 24(%rsp) #339.9[spill]
..___tag_value_solveRB.375:
# printf(const char *__restrict__, ...)
call printf #339.9
..___tag_value_solveRB.376:
# LOE r12 r13
..B4.50: # Preds ..B4.39
# Execution count [2.20e-01]
vmovsd 24(%rsp), %xmm0 #[spill]
vmovsd (%rsp), %xmm1 #[spill]
# LOE r12 r13 xmm0 xmm1
..B4.40: # Preds ..B4.50 ..B4.38
# Execution count [1.00e+00]
# Return value: the compare yields an all-ones mask when xmm0 > xmm1
# ([+64] > residual); its low 32 bits are -1, and negl turns that into 1
# (0 stays 0). Then tear down the frame and pop in reverse push order.
vcmpgtsd %xmm1, %xmm0, %xmm0 #342.16
vmovd %xmm0, %eax #342.16
negl %eax #342.16
addq $280, %rsp #342.16
.cfi_def_cfa_offset 40
.cfi_restore 6
popq %rbp #342.16
.cfi_def_cfa_offset 32
.cfi_restore 3
popq %rbx #342.16
.cfi_def_cfa_offset 24
.cfi_restore 15
popq %r15 #342.16
.cfi_def_cfa_offset 16
.cfi_restore 14
popq %r14 #342.16
.cfi_def_cfa_offset 8
ret #342.16
# The CFI state below re-establishes the in-loop frame description for the
# out-of-line blocks that follow the return.
.cfi_def_cfa_offset 320
.cfi_offset 3, -32
.cfi_offset 6, -40
.cfi_offset 12, -312
.cfi_offset 13, -304
.cfi_offset 14, -16
.cfi_offset 15, -24
# LOE
..B4.41: # Preds ..B4.13
# Execution count [4.19e-01]: Infreq
# Cold path for m <= 0: same end-of-sweep bookkeeping as ..B4.20, except
# that r12d and r13 are still live in registers (..B4.14 never ran), so
# nothing is reloaded from 256(%rsp)/208(%rsp).
movl 192(%rsp), %edx #301.9[spill]
negl %r12d #317.23
incl %edx #301.9
addl $3, %r12d #317.23
movl %edx, 192(%rsp) #301.9[spill]
cmpl $2, %edx #301.9
jb ..B4.5 # Prob 50% #301.9
# LOE r13 r12d r15d
..B4.42: # Preds ..B4.41
# Execution count [2.09e-01]: Infreq
# Cold counterpart of ..B4.21: restore the parked registers, then do the
# row copy if n > 0; otherwise go straight to the reduction.
movl 248(%rsp), %r12d #[spill]
movq 112(%rsp), %rbp #[spill]
movl 120(%rsp), %ebx #[spill]
movl 128(%rsp), %r14d #[spill]
movq %r13, 208(%rsp) #[spill]
xorl %r13d, %r13d #
testl %r12d, %r12d #320.36
jg ..B4.22 # Prob 50% #320.36
jmp ..B4.35 # Prob 100% #320.36
.align 16,0x90
# LOE rbp r13 ebx r12d r14d r15d
.cfi_endproc
# mark_end;
.type solveRB,@function
.size solveRB,.-solveRB
..LNsolveRB.3:
.data
# -- End solveRB
.text
.L_2__routine_start_solveRBA_4:
# -- Begin solveRBA
.text
# mark_begin;
.align 16,0x90
.globl solveRBA
# --- solveRBA(Solver *)
# Compiler-generated entry of solveRBA (AT&T syntax); %rdi holds the Solver pointer.
# The trailing "#line.col" tags refer to the C source, which is not visible here, so
# Solver fields are identified below only by byte offset, written [off].
# c5 / c9 denote .L_2il0floatpacket.5 / .9; their values are defined outside this
# chunk (presumably 0.5 and 1.0 -- TODO confirm).
solveRBA:
# parameter 1: %rdi
..B5.1: # Preds ..B5.0
# Execution count [1.00e+00]
.cfi_startproc
..___tag_value_solveRBA.404:
..L405:
#349.1
# Prologue: %rbp becomes the frame pointer, %rsp is realigned to 64 bytes, then five
# callee-saved registers are pushed and 472 bytes reserved (5*8 + 472 = 512, so %rsp
# stays 64-byte aligned for the zmm spills used later).
pushq %rbp #349.1
.cfi_def_cfa_offset 16
movq %rsp, %rbp #349.1
.cfi_def_cfa 6, 16
.cfi_offset 6, -16
andq $-64, %rsp #349.1
pushq %r12 #349.1
pushq %r13 #349.1
pushq %r14 #349.1
pushq %r15 #349.1
pushq %rbx #349.1
subq $472, %rsp #349.1
.cfi_escape 0x10, 0x03, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xd8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf0, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0f, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x22
# %ebx = 0: it is the integer argument of the final printf when the loop is never
# entered (direct branch to ..B5.58 below).
xorl %ebx, %ebx #351.12
# Scalars derived in this block:
#   xmm16 = c9 / [0]^2            xmm15 = c9 / [8]^2
#   xmm14 = ([72] * c5 * [0]^2 * [8]^2) / ([0]^2 + [8]^2)
#   xmm1  = [64]^2  (value the residual is compared against)
#   xmm2  = [64] + c9  (initial residual)
#   xmm0  = [72], xmm4 = [80]
vmovsd 72(%rdi), %xmm0 #358.21
vmovsd (%rdi), %xmm5 #361.21
vmovsd .L_2il0floatpacket.5(%rip), %xmm9 #365.29
vmulsd %xmm5, %xmm5, %xmm3 #361.34
vmulsd %xmm9, %xmm0, %xmm2 #365.29
vmovsd 8(%rdi), %xmm1 #362.21
vmulsd %xmm1, %xmm1, %xmm7 #362.34
vmulsd %xmm3, %xmm2, %xmm4 #365.42
vmovsd 64(%rdi), %xmm8 #357.21
vmovsd .L_2il0floatpacket.9(%rip), %xmm17 #363.27
vmulsd %xmm8, %xmm8, %xmm1 #370.26
vaddsd %xmm17, %xmm8, %xmm2 #372.17
vdivsd %xmm7, %xmm17, %xmm15 #364.27
vmulsd %xmm7, %xmm4, %xmm6 #365.42
# xmm7 += xmm5*xmm5, i.e. [8]^2 + [0]^2 (the denominator of xmm14).
vfmadd231sd %xmm5, %xmm5, %xmm7 #365.56
vdivsd %xmm3, %xmm17, %xmm16 #363.27
# Integer / pointer fields: %rax=[56], %ecx=[24], %r8d=[28], %r13d=[32], %r12d=[88],
# %rdx=[48]. The Solver pointer and [56] are spilled because %rdi/%rax are reused.
movq 56(%rdi), %rax #367.21
movl 24(%rdi), %ecx #354.21
movl 28(%rdi), %r8d #355.21
movl 32(%rdi), %r13d #356.21
movl 88(%rdi), %r12d #359.21
movq 48(%rdi), %rdx #366.21
vmovsd 80(%rdi), %xmm4 #369.20
movq %rdi, 376(%rsp) #349.1[spill]
vdivsd %xmm7, %xmm6, %xmm14 #365.56
movq %rax, 320(%rsp) #367.21[spill]
# Skip the whole iteration loop when the initial residual is already below xmm1.
vcomisd %xmm1, %xmm2 #374.20
jb ..B5.58 # Prob 10% #374.20
# LOE rdx ecx ebx r8d r12d r13d xmm0 xmm1 xmm2 xmm4 xmm9 xmm14 xmm15 xmm16 xmm17
# Loop-invariant setup for the iteration loop. On entry %rdx = p (Solver offset 48),
# n = %ecx (offset 24), m = %r13d (offset 32), %r8d = offset 28, xmm4 = offset 80
# ("rho" below), xmm9 / xmm17 = .L_2il0floatpacket.5 / .9 ("c5" / "c9"),
# c10 = .L_2il0floatpacket.10 (values defined outside this chunk).
# Results:
#   56(%rsp)  = 3*n          208(%rsp) = n + 2         216(%rsp) = -n
#   48(%rsp)  = 2*n + 4      192(%rsp) = n*m + 2*m     200(%rsp) = n*m + 2*m + n
#   %r9 = p + 8*n    %r8 = p + 16*n
#   %rax = p + 8*(n*m + 2*m)    %r14 = p + 8*(n*m + 2*m + n)
#   %r10d = n >> 1   %edi = m >> 1   %r11d = 0 (iteration counter)
#   xmm3  = (double)(n * [28])
#   40(%rsp)  = c9 / (c9 - c5*rho*rho)      312(%rsp) = c10*rho*rho
#   64(%rsp)  = broadcast of xmm15 (zmm)    128(%rsp) = broadcast of xmm16 (zmm)
#   336/344/352/360(%rsp) = xmm15 / xmm16 / xmm14 / xmm0
# The zmm7-zmm9, ymm4-ymm5 and xmm11 constant loads are not in the live-out list of
# this block; ..B5.14 loads the same constants again into other registers.
..B5.2: # Preds ..B5.1
# Execution count [9.00e-01]
vmulsd %xmm4, %xmm9, %xmm3 #395.64
movl %r13d, %edi #404.9
imull %ecx, %r8d #409.37
vmulsd .L_2il0floatpacket.10(%rip), %xmm4, %xmm5 #396.65
vmovups .L_2il0floatpacket.11(%rip), %zmm9 #386.34
vmovups .L_2il0floatpacket.12(%rip), %zmm8 #386.34
# xmm3 = c9 - rho * (c5*rho)
vfnmadd213sd %xmm17, %xmm4, %xmm3 #395.70
vmovups .L_2il0floatpacket.13(%rip), %zmm7 #386.48
vmulsd %xmm5, %xmm4, %xmm12 #396.71
vmovdqu .L_2il0floatpacket.6(%rip), %ymm5 #383.17
vmovdqu .L_2il0floatpacket.7(%rip), %ymm4 #383.17
vdivsd %xmm3, %xmm17, %xmm13 #395.70
movslq %ecx, %rcx #385.32
# Zero xmm3 first so the int->double conversion below has no false dependency.
vxorpd %xmm3, %xmm3, %xmm3 #409.37
vbroadcastsd %xmm16, %zmm10 #363.19
lea (%rcx,%rcx,2), %r15d #406.30
vbroadcastsd %xmm15, %zmm6 #364.19
vmovsd .L_2il0floatpacket.8(%rip), %xmm11 #386.48
vmovsd %xmm0, 360(%rsp) #401.35[spill]
movl %r15d, 56(%rsp) #406.30[spill]
movl %ecx, %r15d #356.19
imull %r13d, %r15d #356.19
lea 2(%rcx), %r14d #387.67
vmovsd %xmm12, 312(%rsp) #401.35[spill]
vmovsd %xmm13, 40(%rsp) #401.35[spill]
vmovsd %xmm14, 352(%rsp) #401.35[spill]
vmovsd %xmm15, 336(%rsp) #401.35[spill]
movl %r14d, 208(%rsp) #387.67[spill]
lea (%rcx,%r15), %r14d #401.13
movl %ecx, %r10d #405.30
lea (%r14,%r13,2), %esi #356.19
movslq %esi, %rsi #401.13
lea (%r15,%r13,2), %r15d #401.35
movslq %r15d, %r15 #401.35
negl %r10d #405.30
vcvtsi2sd %r8d, %xmm3, %xmm3 #409.37
vmovups %zmm6, 64(%rsp) #401.35[spill]
vmovups %zmm10, 128(%rsp) #401.35[spill]
vmovsd %xmm16, 344(%rsp) #401.35[spill]
movl %r10d, 216(%rsp) #405.30[spill]
lea (,%rcx,8), %r8 #400.35
movl %ecx, %r10d #399.9
lea (%r8,%rcx,8), %r8 #406.30
shrl $1, %edi #404.9
lea 4(%rcx,%rcx), %eax #387.67
movq %rcx, 416(%rsp) #385.32[spill]
xorl %r11d, %r11d #374.5
movl %eax, 48(%rsp) #387.67[spill]
addq %rdx, %r8 #406.30
shrl $1, %r10d #399.9
lea (%rdx,%rcx,8), %r9 #400.35
movl %r15d, 192(%rsp) #401.35[spill]
lea (%rdx,%rsi,8), %r14 #401.13
movl %esi, 200(%rsp) #401.35[spill]
lea (%rdx,%r15,8), %rax #401.35
# LOE rax rdx r8 r9 r14 ecx ebx edi r10d r11d r12d r13d xmm1 xmm2 xmm3
# Head of the outer iteration loop. %r11d is pre-incremented; the loop exits to
# ..B5.57 once the previous counter value (%r11d - 1) is >= the limit in %r12d.
..B5.3: # Preds ..B5.56 ..B5.2
# Execution count [2.62e+00]
incl %r11d #374.5
lea -1(%r11), %r15d #409.9
cmpl %r12d, %r15d #374.36
jge ..B5.57 # Prob 20% #374.36
# LOE rax rdx r8 r9 r14 ecx ebx edi r10d r11d r12d r13d xmm1 xmm2 xmm3
# Per-iteration initialisation: pass counter byte at 392(%rsp) = 0, %ebx = 1
# (starting column parity of the first pass), residual accumulator at 328(%rsp) = 0.0.
# Everything else that must survive the calls in the pass loop is spilled here and
# reloaded in ..B5.42.
..B5.4: # Preds ..B5.3
# Execution count [2.09e+00]
xorb %r15b, %r15b #378.9
movl $1, %ebx #376.9
vxorpd %xmm0, %xmm0, %xmm0 #375.9
vmovsd %xmm0, 328(%rsp) #380.13[spill]
vmovsd %xmm3, 304(%rsp) #380.13[spill]
vmovsd %xmm1, 296(%rsp) #380.13[spill]
movb %r15b, 392(%rsp) #380.13[spill]
movq %rax, 248(%rsp) #380.13[spill]
movq %r14, 256(%rsp) #380.13[spill]
movl %r10d, 264(%rsp) #380.13[spill]
movq %r9, 272(%rsp) #380.13[spill]
movq %r8, 280(%rsp) #380.13[spill]
movl %edi, 288(%rsp) #380.13[spill]
movl %r11d, 384(%rsp) #380.13[spill]
movq %rdx, 408(%rsp) #380.13[spill]
movl %r12d, 240(%rsp) #380.13[spill]
movl %ecx, 400(%rsp) #380.13[spill]
# LOE ebx r13d
# Start of one pass: inlined neighbour exchange (all tagged with source line 380).
# Notation: S = Solver pointer (spilled at 376(%rsp)), p = S[48], n = S[24],
# m = S[32], r = S[36], S[40] = upper bound compared against r + 1.
# Four 4-byte request slots at 224..236(%rsp) are pre-filled with 738197504
# (0x2C000000) so MPI_Waitall can be called on all four even when a neighbour is
# absent -- presumably that value is MPI_REQUEST_NULL in this MPI's handle encoding;
# TODO confirm against mpi.h. Likewise 1275070475 (0x4C00080B) and 1140850688
# (0x44000000) are passed as datatype and communicator -- presumably MPI_DOUBLE and
# MPI_COMM_WORLD; TODO confirm.
..B5.5: # Preds ..B5.41 ..B5.4
# Execution count [4.19e+00]
movq 376(%rsp), %rax #380.13[spill]
movl $738197504, %r12d #380.13
movl %r12d, 224(%rsp) #380.13
movl %r12d, 228(%rsp) #380.13
movl 36(%rax), %r15d #380.13
movl %r12d, 232(%rsp) #380.13
movl %r12d, 236(%rsp) #380.13
# %r12d now takes the starting column for the sweep (copy of %ebx).
movl %ebx, %r12d #379.13
lea 1(%r15), %r14d #380.13
# No exchange with r + 1 when r + 1 >= S[40].
cmpl 40(%rax), %r14d #380.13
jge ..B5.9 # Prob 78% #380.13
# LOE rax ebx r12d r13d r14d r15d
# Send to r + 1: buf = &p[(n+2)*m + 1], count = n, tag 1, request slot 0.
# The 7th argument (request pointer) goes on the stack, so %rsp is lowered by 16;
# until the matching "addq $16" every %rsp offset in this region is shifted by +16.
..B5.6: # Preds ..B5.5
# Execution count [9.21e-01]
addq $-16, %rsp #380.13
movl $1275070475, %edx #380.13
movl %r14d, %ecx #380.13
lea 240(%rsp), %r15 #380.13
movl $1, %r8d #380.13
movl $1140850688, %r9d #380.13
movq %r15, (%rsp) #380.13
vzeroupper #380.13
movl 24(%rax), %esi #380.13
movl 32(%rax), %r15d #380.13
movq 48(%rax), %rax #380.13
movq %rax, 48(%rsp) #380.13[spill]
lea 2(%rsi), %r10d #380.13
movl %r10d, 40(%rsp) #380.13[spill]
imull %r15d, %r10d #380.13
movslq %r10d, %r10 #380.13
lea 8(%rax,%r10,8), %rdi #380.13
..___tag_value_solveRBA.448:
# MPI_Isend(const void *, int, MPI_Datatype, int, int, MPI_Comm, MPI_Request *)
call MPI_Isend #380.13
..___tag_value_solveRBA.449:
# LOE ebx r12d r13d r14d r15d
..B5.65: # Preds ..B5.6
# Execution count [9.21e-01]
movq 48(%rsp), %rax #[spill]
# LOE rax ebx r12d r13d r14d r15d
# Receive from r + 1: buf = &p[(n+2)*(m+1) + 1], count = n, tag 2, request slot 1.
..B5.7: # Preds ..B5.65
# Execution count [9.21e-01]
incl %r15d #380.13
imull 40(%rsp), %r15d #380.13[spill]
movl $1275070475, %edx #380.13
movslq %r15d, %r15 #380.13
movl %r14d, %ecx #380.13
movl $2, %r8d #380.13
movl $1140850688, %r9d #380.13
lea 8(%rax,%r15,8), %rdi #380.13
lea 244(%rsp), %rax #380.13
movq %rax, (%rsp) #380.13
# %rax = %rsp + 244, so 148(%rax) is 392(%rsp): the Solver pointer spill
# (376 in the unshifted frame).
movq 148(%rax), %r10 #380.13[spill]
movl 24(%r10), %esi #380.13
..___tag_value_solveRBA.453:
# MPI_Irecv(void *, int, MPI_Datatype, int, int, MPI_Comm, MPI_Request *)
call MPI_Irecv #380.13
..___tag_value_solveRBA.454:
# LOE ebx r12d r13d
..B5.66: # Preds ..B5.7
# Execution count [9.21e-01]
addq $16, %rsp #380.13
# LOE ebx r12d r13d
..B5.8: # Preds ..B5.66
# Execution count [9.21e-01]
movq 376(%rsp), %rax #380.13[spill]
movl 36(%rax), %r15d #380.13
# LOE rax ebx r12d r13d r15d
# No exchange with r - 1 when r <= 0.
..B5.9: # Preds ..B5.8 ..B5.5
# Execution count [4.19e+00]
testl %r15d, %r15d #380.13
jle ..B5.12 # Prob 40% #380.13
# LOE rax ebx r12d r13d r15d
# Send to r - 1: buf = &p[n + 3], count = n, tag 2, request slot 2.
# %r14 keeps p across the call (callee-saved register).
..B5.10: # Preds ..B5.9
# Execution count [2.50e+00]
addq $-16, %rsp #380.13
decl %r15d #380.13
movl $1275070475, %edx #380.13
lea 248(%rsp), %r14 #380.13
movl %r15d, %ecx #380.13
movl $2, %r8d #380.13
movl $1140850688, %r9d #380.13
movq %r14, (%rsp) #380.13
movq %rax, %r10 #380.13
vzeroupper #380.13
movq 48(%r10), %r14 #380.13
movslq 24(%r10), %rax #380.13
movl 24(%r10), %esi #380.13
lea 24(%r14,%rax,8), %rdi #380.13
..___tag_value_solveRBA.456:
# MPI_Isend(const void *, int, MPI_Datatype, int, int, MPI_Comm, MPI_Request *)
call MPI_Isend #380.13
..___tag_value_solveRBA.457:
# LOE r14 ebx r12d r13d r15d
# Receive from r - 1: buf = &p[1], count = n, tag 1, request slot 3.
..B5.11: # Preds ..B5.10
# Execution count [2.50e+00]
addq $8, %r14 #380.13
movq %r14, %rdi #380.13
lea 252(%rsp), %rax #380.13
movl $1275070475, %edx #380.13
movl %r15d, %ecx #380.13
movl $1, %r8d #380.13
movl $1140850688, %r9d #380.13
movq %rax, (%rsp) #380.13
# %rax = %rsp + 252, so 140(%rax) is again 392(%rsp): the Solver pointer spill.
movq 140(%rax), %r10 #380.13[spill]
movl 24(%r10), %esi #380.13
..___tag_value_solveRBA.459:
# MPI_Irecv(void *, int, MPI_Datatype, int, int, MPI_Comm, MPI_Request *)
call MPI_Irecv #380.13
..___tag_value_solveRBA.460:
# LOE ebx r12d r13d
..B5.68: # Preds ..B5.11
# Execution count [2.50e+00]
addq $16, %rsp #380.13
# LOE ebx r12d r13d
# Wait for all four request slots. The status argument is the constant 1 --
# presumably MPI_STATUSES_IGNORE in this MPI implementation; TODO confirm.
..B5.12: # Preds ..B5.68 ..B5.9
# Execution count [4.19e+00]
movl $4, %edi #380.13
lea 224(%rsp), %rsi #380.13
movl $1, %edx #380.13
vzeroupper #380.13
..___tag_value_solveRBA.461:
# MPI_Waitall(int, MPI_Request *, MPI_Status *)
call MPI_Waitall #380.13
..___tag_value_solveRBA.462:
# LOE ebx r12d r13d
# Sweep preheader. %r14d = 0 is the zero-based row counter; the sweep is skipped
# entirely when the row count in %r13d is <= 0.
..B5.13: # Preds ..B5.12
# Execution count [4.19e+00]
xorl %r14d, %r14d #382.13
testl %r13d, %r13d #382.45
jle ..B5.37 # Prob 10% #382.45
# LOE ebx r12d r13d r14d
# Reload constants clobbered by the MPI calls:
#   xmm11 = 360(%rsp) * 352(%rsp)  (update scale), zmm0 = broadcast of xmm11
#   zmm5 / zmm1 = the broadcast vectors spilled at 64 / 128(%rsp)
#   xmm13 / xmm7 = their scalar counterparts (336 / 344(%rsp))
#   xmm6 = running residual sum (328(%rsp))
#   xmm9 = .L_2il0floatpacket.8, zmm4 = .L_2il0floatpacket.13 (values not visible in
#          this chunk; both multiply the centre value in the stencil)
#   zmm2 / zmm3 = permutation index vectors .L_2il0floatpacket.11 / .12
#   %r10 = 320(%rsp) (Solver offset 56 array), %rdi = p, %r9d = n
# %ebx is parked at 368(%rsp) because the row loop reuses it.
..B5.14: # Preds ..B5.13
# Execution count [3.77e+00]
vmovsd 360(%rsp), %xmm0 #389.41[spill]
vmulsd 352(%rsp), %xmm0, %xmm11 #389.41[spill]
vmovups 64(%rsp), %zmm5 #389.41[spill]
vmovups 128(%rsp), %zmm1 #389.41[spill]
vmovdqu .L_2il0floatpacket.7(%rip), %ymm8 #389.41
vmovdqu .L_2il0floatpacket.6(%rip), %ymm12 #389.41
vmovsd 328(%rsp), %xmm6 #389.41[spill]
vmovsd 336(%rsp), %xmm13 #389.41[spill]
vmovsd 344(%rsp), %xmm7 #389.41[spill]
vmovsd .L_2il0floatpacket.8(%rip), %xmm9 #389.41
vbroadcastsd %xmm11, %zmm0 #389.41
vmovups .L_2il0floatpacket.13(%rip), %zmm4 #389.41
vmovups .L_2il0floatpacket.12(%rip), %zmm3 #389.41
vmovups .L_2il0floatpacket.11(%rip), %zmm2 #389.41
movl %ebx, 368(%rsp) #389.41[spill]
movq 320(%rsp), %r10 #389.41[spill]
movq 408(%rsp), %rdi #389.41[spill]
movl 400(%rsp), %r9d #389.41[spill]
# LOE rdi r10 r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
# Top of the row loop. %r12d = first column of this row, %r9d = n, %r14d = zero-based
# row counter, %rdi = p, %r10 = second array (Solver offset 56).
# The row is skipped when the first column is already > n.
..B5.15: # Preds ..B5.35 ..B5.14
# Execution count [2.09e+01]
cmpl %r9d, %r12d #383.46
jg ..B5.35 # Prob 50% #383.46
# LOE rdi r10 r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
# ..B5.16-..B5.21 compute byte distances between the address written in this row
# (8(%rsp)) and three load addresses, and compare each distance in both directions
# against bounds derived from the trip count (16*trips - 8 and 16*trips + 8).
# A failed test branches to the scalar loop (..B5.31 / ..B5.32).
# NOTE(review): this looks like a compiler-inserted runtime overlap check guarding
# the vectorized loop -- confirm against the optimization report.
# Also computed here: %esi = (n - first_col + 2) / 2 (signed, rounds toward zero) =
# number of column steps; %ebx = n - first_col + 2; %r11 = sign-extended first_col;
# %rdx = (n + 2) * row.
..B5.16: # Preds ..B5.15
# Execution count [0.00e+00]
movq 416(%rsp), %rax #387.67[spill]
movl %r9d, %ecx #354.21
movslq %r14d, %r14 #385.32
subl %r12d, %ecx #354.21
movslq %r12d, %r11 #385.32
lea 2(%rax), %rdx #387.67
imulq %r14, %rdx #385.32
lea (%rax,%r11), %rbx #385.32
addq %rdx, %rbx #385.32
lea 8(%rdi,%rbx,8), %rsi #386.64
movq %rsi, 8(%rsp) #386.64[spill]
lea 16(%r10,%rbx,8), %rax #385.32
negq %rax #385.32
lea 2(%rcx), %ebx #354.21
movl %ebx, %r8d #383.17
addq %rsi, %rax #385.32
shrl $31, %r8d #383.17
lea 2(%rcx,%r8), %esi #354.21
sarl $1, %esi #354.21
movslq %esi, %r15 #354.21
shlq $4, %r15 #383.17
movq %r15, 16(%rsp) #383.17[spill]
lea -8(%r15), %rcx #383.17
movq %rcx, (%rsp) #383.17[spill]
cmpq %rcx, %rax #383.17
jge ..B5.18 # Prob 50% #383.17
# LOE rax rdx rdi r10 r11 r15 ebx esi r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
..B5.17: # Preds ..B5.16
# Execution count [0.00e+00]
movq %r15, %rcx #383.17
negq %rax #386.64
lea 8(%rcx), %r8 #383.17
cmpq %r8, %rax #383.17
jl ..B5.31 # Prob 50% #383.17
# LOE rdx rdi r10 r11 r15 ebx esi r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
# %r8d = (n + 2) * row and 432(%rsp) = %r8d + 2*n are the row offsets used by all
# three loop versions.
..B5.18: # Preds ..B5.16 ..B5.17
# Execution count [0.00e+00]
movl 208(%rsp), %r8d #387.37[spill]
imull %r14d, %r8d #387.37
lea (%r8,%r9,2), %eax #387.37
movl %eax, 432(%rsp) #387.37[spill]
cltq #387.37
addq %r11, %rax #387.37
lea 32(%rdi,%rax,8), %rcx #387.37
negq %rcx #387.37
addq 8(%rsp), %rcx #387.37[spill]
cmpq (%rsp), %rcx #383.17[spill]
jge ..B5.20 # Prob 50% #383.17
# LOE rdx rcx rdi r10 r11 r15 ebx esi r8d r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
..B5.19: # Preds ..B5.18
# Execution count [0.00e+00]
movq %r15, %rax #383.17
negq %rcx #386.64
lea 8(%rax), %r15 #383.17
cmpq %r15, %rcx #383.17
jl ..B5.32 # Prob 50% #383.17
# LOE rdx rdi r10 r11 ebx esi r8d r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
..B5.20: # Preds ..B5.18 ..B5.19
# Execution count [0.00e+00]
addq %r11, %rdx #387.67
lea (%rdi,%rdx,8), %rax #387.67
movq 8(%rsp), %rdx #387.67[spill]
subq %rax, %rdx #387.67
movq %rdx, 8(%rsp) #387.67[spill]
cmpq (%rsp), %rdx #383.17[spill]
jge ..B5.22 # Prob 50% #383.17
# LOE rdx rdi r10 r11 ebx esi r8d r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
..B5.21: # Preds ..B5.20
# Execution count [0.00e+00]
movq %rdx, %rax #386.64
movq 16(%rsp), %rdx #383.17[spill]
negq %rax #386.64
addq $8, %rdx #383.17
cmpq %rdx, %rax #383.17
jl ..B5.32 # Prob 50% #383.17
# LOE rdi r10 r11 ebx esi r8d r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
# All distance tests passed: zero the two vector accumulators (zmm10, zmm14).
# With fewer than 16 column steps the unrolled loop is bypassed via ..B5.61.
..B5.22: # Preds ..B5.20 ..B5.21
# Execution count [9.42e+00]
vpxord %zmm10, %zmm10, %zmm10 #390.21
vmovaps %zmm10, %zmm14 #390.21
cmpl $16, %esi #383.17
jl ..B5.61 # Prob 10% #383.17
# LOE rdi r10 r11 esi r8d r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5 zmm10 zmm14
# Preheader of the unrolled vector loop.
#   %rbx = p + 8*first_col, %r15 = second array + 8*first_col
#   %r11 = p + 8*((n+2)*row + first_col + n)  (streaming pointer, +256 bytes per pass)
#   %ecx = n + (n+2)*row, %r9d = 432(%rsp) = (n+2)*row + 2*n, %r8d = (n+2)*row
#   %eax = column steps rounded down to a multiple of 16, %edx = steps done
#   k1 = 85 (0x55): write/zero mask selecting the even-numbered lanes
# %r13d is spilled to 424(%rsp) because the loop uses it as scratch.
..B5.23: # Preds ..B5.22
# Execution count [9.42e+00]
movslq %r12d, %r12 #386.64
lea (%rdi,%r11,8), %rbx #386.54
movl $85, %eax #385.32
lea (%r10,%r11,8), %r15 #385.32
movslq %r8d, %r11 #386.64
xorl %edx, %edx #383.17
addq %r12, %r11 #386.64
lea (%r9,%r8), %ecx #385.32
addq 416(%rsp), %r11 #386.64[spill]
kmovw %eax, %k1 #385.32
movl %esi, %eax #383.17
vmovdqu32 .L_2il0floatpacket.14(%rip), %zmm23 #385.32
vmovdqu32 .L_2il0floatpacket.15(%rip), %zmm24 #385.32
vmovdqu32 .L_2il0floatpacket.16(%rip), %zmm26 #385.32
movl %r13d, 424(%rsp) #366.21[spill]
andl $-16, %eax #383.17
movl 432(%rsp), %r9d #366.21[spill]
lea (%rdi,%r11,8), %r11 #366.21
# LOE rbx r10 r11 r15 eax edx ecx esi r8d r9d r12d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5 zmm10 zmm14 zmm23 zmm24 zmm26 k1
# Vector loop body: 16 column steps per pass (%edx += 16), handled as two
# independent groups of 8. For each group the loop
#   - loads contiguous data from the current row and uses the index vectors
#     zmm2 / zmm3 (vpermi2pd / vpermt2pd) to split it into two 8-lane vectors
#     (index contents are defined outside this chunk -- presumably even/odd
#     element selection, TODO confirm),
#   - loads every other element of the second array and of the rows at offsets
#     %r9d and %r8d with mask k1 and packs them via zmm23,
#   - forms the residual-like value (zmm22 for group 1, zmm18 for group 2),
#   - subtracts zmm0 * residual from the centre values and scatters them back with
#     zmm24 / zmm26 permutes and k1-masked stores,
#   - accumulates residual^2 into zmm10 (group 1) and zmm14 (group 2).
..B5.24: # Preds ..B5.24 ..B5.23
# Execution count [5.23e+01]
vmovupd 16(%r11), %zmm19 #386.34
lea (%rcx,%rdx,2), %edi #385.32
vmovupd 80(%r11), %zmm27 #386.34
vmovupd 144(%r11), %zmm20 #386.34
vmovupd 208(%r11), %zmm30 #386.34
vmovupd 8(%r11), %zmm25 #386.34
vmovupd 72(%r11), %zmm18 #386.34
vmovupd 136(%r11), %zmm17 #386.34
vmovaps %zmm2, %zmm22 #386.34
lea (%r9,%rdx,2), %r13d #387.37
vpermi2pd %zmm27, %zmm19, %zmm22 #386.34
vpermt2pd %zmm27, %zmm3, %zmm19 #386.34
vmovupd 200(%r11), %zmm27 #386.34
vfnmadd231pd %zmm22, %zmm4, %zmm19 #386.54
movslq %edi, %rdi #385.32
addq $256, %r11 #383.17
vmovaps %zmm2, %zmm15 #386.34
vmovaps %zmm2, %zmm31 #386.64
vpermi2pd %zmm30, %zmm20, %zmm15 #386.34
vpermt2pd %zmm30, %zmm3, %zmm20 #386.34
vpermi2pd %zmm18, %zmm25, %zmm31 #386.64
vpermt2pd %zmm18, %zmm3, %zmm25 #386.64
vmovupd 16(%r15,%rdi,8), %zmm21{%k1}{z} #385.32
vmovupd 80(%r15,%rdi,8), %zmm28{%k1}{z} #385.32
vmovupd 144(%r15,%rdi,8), %zmm16{%k1}{z} #385.32
vmovupd 208(%r15,%rdi,8), %zmm29{%k1}{z} #385.32
vfnmadd231pd %zmm4, %zmm15, %zmm20 #386.54
vaddpd %zmm31, %zmm19, %zmm18 #386.64
vpermt2pd %zmm28, %zmm23, %zmm21 #385.32
vpermt2pd %zmm29, %zmm23, %zmm16 #385.32
vfmsub231pd %zmm1, %zmm18, %zmm21 #387.82
vmovaps %zmm2, %zmm19 #386.64
movslq %r13d, %r13 #387.37
vpermi2pd %zmm27, %zmm17, %zmm19 #386.64
vpermt2pd %zmm27, %zmm3, %zmm17 #386.64
vmovupd 32(%rbx,%r13,8), %zmm18{%k1}{z} #387.37
vmovupd 96(%rbx,%r13,8), %zmm28{%k1}{z} #387.37
vmovupd 224(%rbx,%r13,8), %zmm29{%k1}{z} #387.37
vaddpd %zmm19, %zmm20, %zmm20 #386.64
vpermt2pd %zmm28, %zmm23, %zmm18 #387.37
vmovupd 160(%rbx,%r13,8), %zmm19{%k1}{z} #387.37
vfmsub231pd %zmm1, %zmm20, %zmm16 #387.82
vpermt2pd %zmm29, %zmm23, %zmm19 #387.37
lea (%r8,%rdx,2), %r13d #387.67
addl $16, %edx #383.17
movslq %r13d, %r13 #387.67
vmovupd (%rbx,%r13,8), %zmm29{%k1}{z} #387.67
vmovupd 64(%rbx,%r13,8), %zmm30{%k1}{z} #387.67
vpermt2pd %zmm30, %zmm23, %zmm29 #387.67
vfmsub213pd %zmm29, %zmm4, %zmm22 #387.82
vsubpd %zmm18, %zmm22, %zmm22 #387.82
vmovupd 128(%rbx,%r13,8), %zmm18{%k1}{z} #387.67
vfmsub213pd %zmm21, %zmm5, %zmm22 #387.82
vmovupd 192(%rbx,%r13,8), %zmm21{%k1}{z} #387.67
# zmm25 (centre values, group 1) -= zmm0 * zmm22;  zmm10 += zmm22^2
vfnmadd231pd %zmm22, %zmm0, %zmm25 #389.21
vfmadd231pd %zmm22, %zmm22, %zmm10 #390.21
vpermt2pd %zmm21, %zmm23, %zmm18 #387.67
vfmsub231pd %zmm4, %zmm15, %zmm18 #387.82
vsubpd %zmm19, %zmm18, %zmm18 #387.82
vfmsub213pd %zmm16, %zmm5, %zmm18 #387.82
vpermpd %zmm25, %zmm24, %zmm16 #389.21
vpermpd %zmm25, %zmm26, %zmm25 #389.21
# zmm17 (centre values, group 2) -= zmm0 * zmm18;  zmm14 += zmm18^2
vfnmadd231pd %zmm18, %zmm0, %zmm17 #389.21
vmovupd %zmm16, 16(%rbx,%rdi,8){%k1} #389.21
vmovupd %zmm25, 80(%rbx,%rdi,8){%k1} #389.21
vfmadd231pd %zmm18, %zmm18, %zmm14 #390.21
vpermpd %zmm17, %zmm24, %zmm15 #389.21
vpermpd %zmm17, %zmm26, %zmm17 #389.21
vmovupd %zmm15, 144(%rbx,%rdi,8){%k1} #389.21
vmovupd %zmm17, 208(%rbx,%rdi,8){%k1} #389.21
cmpl %eax, %edx #383.17
jb ..B5.24 # Prob 82% #383.17
# LOE rbx r10 r11 r15 eax edx ecx esi r8d r9d r12d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5 zmm10 zmm14 zmm23 zmm24 zmm26 k1
# After the unrolled loop: restore %rdi (p), %r13d and %r9d (n), which the loop used
# as scratch.
..B5.25: # Preds ..B5.24
# Execution count [9.42e+00]
movq 408(%rsp), %rdi #[spill]
movl 424(%rsp), %r13d #[spill]
movl 400(%rsp), %r9d #[spill]
# LOE rdi r10 eax esi r8d r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5 zmm10 zmm14
# %eax = column steps already done, %esi = total column steps. Nothing remains when
# %eax + 1 > %esi (unsigned compare).
..B5.26: # Preds ..B5.25 ..B5.61
# Execution count [1.05e+01]
lea 1(%rax), %edx #383.17
cmpl %esi, %edx #383.17
ja ..B5.30 # Prob 50% #383.17
# LOE rdi r10 eax esi r8d r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5 zmm10 zmm14
# Masked remainder preheader: %esi becomes the number of remaining steps and is
# broadcast to ymm18; ymm19 is the per-lane step index (starts from ymm8 =
# .L_2il0floatpacket.7). %edx / %ebx / %ecx are the three row offsets advanced past
# the 2*%eax elements already processed.
..B5.27: # Preds ..B5.26
# Execution count [9.42e+00]
subl %eax, %esi #383.17
lea (%r12,%r9,2), %ebx #387.37
addl %r8d, %ebx #387.37
lea (%r9,%r12), %edx #385.32
vmovdqa32 %ymm8, %ymm19 #383.17
lea (%r12,%r8), %ecx #387.67
addl %edx, %r8d #385.32
xorl %r11d, %r11d #383.17
vpbroadcastd %esi, %ymm18 #383.17
lea (%rcx,%rax,2), %ecx #387.67
vmovdqu32 .L_2il0floatpacket.14(%rip), %zmm17 #385.32
vmovdqu32 .L_2il0floatpacket.15(%rip), %zmm20 #385.32
vmovdqu32 .L_2il0floatpacket.16(%rip), %zmm21 #385.32
lea (%rbx,%rax,2), %ebx #387.37
lea (%r8,%rax,2), %edx #385.32
# LOE rdi r10 edx ecx ebx esi r9d r11d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 ymm18 ymm19 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5 zmm10 zmm14 zmm17 zmm20 zmm21
# Masked remainder loop: 8 column steps per pass (%r11d += 8). k5 marks the lanes
# whose step index (ymm19) is still below the remaining count (ymm18); ymm19 is then
# advanced by ymm12 (.L_2il0floatpacket.6). k1-k4 are load/store masks derived from
# k5 (k2 = k1 >> 8, k4 = k3 >> 8 cover the second 64-byte half). The arithmetic
# mirrors one group of the unrolled loop; the squared-residual accumulation into
# zmm10 is masked by k5 so inactive lanes contribute nothing.
..B5.28: # Preds ..B5.28 ..B5.27
# Execution count [5.23e+01]
vpcmpgtd %ymm19, %ymm18, %k5 #383.17
lea (%rdx,%r11,2), %eax #387.67
vpaddd %ymm12, %ymm19, %ymm19 #383.17
kmovw %k5, %r8d #383.17
vpmovm2q %k5, %zmm22 #386.34
vpbroadcastb %r8d, %zmm23 #385.32
vpmovd2m %zmm22, %k3 #386.34
vptestmb .L_2il0floatpacket.17(%rip), %zmm23, %k1 #385.32
kshiftrw $8, %k3, %k4 #386.34
kshiftrq $8, %k1, %k2 #385.32
movslq %eax, %rax #385.32
lea (%rbx,%r11,2), %r15d #387.37
movslq %r15d, %r15 #387.37
lea (%rcx,%r11,2), %r8d #387.67
movslq %r8d, %r8 #387.67
addl $8, %r11d #383.17
vmovaps %zmm2, %zmm22 #386.34
vmovupd 16(%rdi,%rax,8), %zmm27{%k3}{z} #386.34
vmovupd 80(%rdi,%rax,8), %zmm25{%k4}{z} #386.34
vmovupd 32(%rdi,%r15,8), %zmm23{%k1}{z} #387.37
vmovupd 96(%rdi,%r15,8), %zmm30{%k2}{z} #387.37
vmovupd 8(%rdi,%rax,8), %zmm15{%k3}{z} #386.64
vmovupd 72(%rdi,%rax,8), %zmm26{%k4}{z} #386.64
vmovupd 64(%rdi,%r8,8), %zmm31{%k2}{z} #387.67
vmovupd 16(%r10,%rax,8), %zmm16{%k1}{z} #385.32
vmovupd 80(%r10,%rax,8), %zmm24{%k2}{z} #385.32
vpermi2pd %zmm25, %zmm27, %zmm22 #386.34
vpermt2pd %zmm25, %zmm3, %zmm27 #386.34
vpermt2pd %zmm30, %zmm17, %zmm23 #387.37
vpermt2pd %zmm24, %zmm17, %zmm16 #385.32
vmovupd (%rdi,%r8,8), %zmm30{%k1}{z} #387.67
vfnmadd231pd %zmm22, %zmm4, %zmm27 #386.54
vpermt2pd %zmm31, %zmm17, %zmm30 #387.67
vmovaps %zmm2, %zmm28 #386.64
vpermi2pd %zmm26, %zmm15, %zmm28 #386.64
vpermt2pd %zmm26, %zmm3, %zmm15 #386.64
vfmsub213pd %zmm30, %zmm4, %zmm22 #387.82
vaddpd %zmm28, %zmm27, %zmm29 #386.64
vsubpd %zmm23, %zmm22, %zmm24 #387.82
vfmsub231pd %zmm1, %zmm29, %zmm16 #387.82
vfmsub213pd %zmm16, %zmm5, %zmm24 #387.82
vfnmadd231pd %zmm24, %zmm0, %zmm15 #389.21
vfmadd231pd %zmm24, %zmm24, %zmm10{%k5} #390.21
vpermpd %zmm15, %zmm20, %zmm16 #389.21
vpermpd %zmm15, %zmm21, %zmm15 #389.21
vmovupd %zmm16, 16(%rdi,%rax,8){%k1} #389.21
vmovupd %zmm15, 80(%rdi,%rax,8){%k2} #389.21
cmpl %esi, %r11d #383.17
jb ..B5.28 # Prob 82% #383.17
# LOE rdi r10 edx ecx ebx esi r9d r11d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 ymm18 ymm19 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5 zmm10 zmm14 zmm17 zmm20 zmm21
# Horizontal reduction: add the two accumulators, fold the upper 256 bits onto the
# lower (vshuff32x4 $238), then swap 128-bit pairs ($78) and adjacent elements ($177)
# so lane 0 of zmm19 holds the full sum, which is added to the scalar total in xmm6.
..B5.30: # Preds ..B5.28 ..B5.26
# Execution count [9.42e+00]
vaddpd %zmm14, %zmm10, %zmm14 #390.21
vshuff32x4 $238, %zmm14, %zmm14, %zmm10 #390.21
vaddpd %zmm14, %zmm10, %zmm15 #390.21
vpermpd $78, %zmm15, %zmm16 #390.21
vaddpd %zmm16, %zmm15, %zmm17 #390.21
vpermpd $177, %zmm17, %zmm18 #390.21
vaddpd %zmm18, %zmm17, %zmm19 #390.21
vaddsd %xmm6, %xmm19, %xmm6 #390.21
jmp ..B5.35 # Prob 100% #390.21
# LOE rdi r10 r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
# Scalar fallback for one row, taken when a distance test before the vector loop
# fails. ..B5.31 is reached before %r8d and 432(%rsp) were computed, so it derives
# them here: %r8d = (n + 2) * row, 432(%rsp) = %r8d + 2*n  (n = %r9d, row = %r14d).
..B5.31: # Preds ..B5.17
# Execution count [0.00e+00]
movl 208(%rsp), %r8d #387.67[spill]
imull %r14d, %r8d #387.67
lea (%r8,%r9,2), %eax #387.37
movl %eax, 432(%rsp) #387.37[spill]
# LOE rdi r10 r11 ebx r8d r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
# Preheader: %ebx = (n - first_col + 2) >> 1 = trip count, %eax = step counter k,
# %rcx = p + 8*first_col, %r11 = second array + 8*first_col,
# %edx = n + (n+2)*row, %r9d = (n+2)*row + 2*n.
..B5.32: # Preds ..B5.21 ..B5.19 ..B5.31
# Execution count [9.42e+00]
shrl $1, %ebx #354.21
xorl %eax, %eax #383.17
lea (%r9,%r8), %edx #385.32
movl 432(%rsp), %r9d #385.32[spill]
lea (%rdi,%r11,8), %rcx #386.34
lea (%r10,%r11,8), %r11 #385.32
.align 16,0x90
# LOE rcx rdi r10 r11 eax edx ebx r8d r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
# One stencil update per pass, columns col = first_col + 2*k. With base = (n+2)*row
# and c8 = xmm9 (.L_2il0floatpacket.8, value not visible in this chunk):
#   centre = p[base + (n+2) + col]                      (xmm19)
#   right  = centre address + 8 (xmm10), left = centre address - 8
#   next   = p[base + 2*(n+2) + col] (xmm15), prev = p[base + col]
#   r      = second_array[base + (n+2) + col]
#            - xmm7  * (right - c8*centre + left)
#            - xmm13 * (next  - c8*centre + prev)       (xmm20)
#   centre -= xmm11 * r ;  xmm6 += r*r
..B5.33: # Preds ..B5.33 ..B5.32
# Execution count [5.23e+01]
lea (%rdx,%rax,2), %esi #387.57
movslq %esi, %rsi #385.32
lea (%r9,%rax,2), %r15d #387.37
movslq %r15d, %r15 #387.37
vmovsd 16(%rcx,%rsi,8), %xmm19 #387.57
vmulsd %xmm19, %xmm9, %xmm16 #387.57
vmovsd 24(%rcx,%rsi,8), %xmm10 #386.34
vmovsd 32(%rcx,%r15,8), %xmm15 #387.37
lea (%r8,%rax,2), %r15d #387.67
movslq %r15d, %r15 #387.67
incl %eax #383.17
vsubsd %xmm16, %xmm10, %xmm14 #386.54
vsubsd %xmm16, %xmm15, %xmm17 #387.57
vaddsd 8(%rcx,%rsi,8), %xmm14, %xmm20 #386.64
vaddsd (%rcx,%r15,8), %xmm17, %xmm18 #387.67
vfnmadd213sd 16(%r11,%rsi,8), %xmm7, %xmm20 #387.82
vfnmadd231sd %xmm13, %xmm18, %xmm20 #387.82
vfnmadd231sd %xmm20, %xmm11, %xmm19 #389.21
vfmadd231sd %xmm20, %xmm20, %xmm6 #390.21
vmovsd %xmm19, 16(%rcx,%rsi,8) #389.21
cmpl %ebx, %eax #383.17
jb ..B5.33 # Prob 82% #383.17
# LOE rcx rdi r10 r11 eax edx ebx r8d r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
# Restore %r9d = n, which the loop overwrote with a row offset.
..B5.34: # Preds ..B5.33
# Execution count [9.42e+00]
movl 400(%rsp), %r9d #[spill]
# LOE rdi r10 r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
# End of one row: the starting column alternates (first_col = 3 - first_col, i.e.
# 1 <-> 2), the row counter advances, and the row loop repeats while %r14d < %r13d.
..B5.35: # Preds ..B5.34 ..B5.30 ..B5.15
# Execution count [2.09e+01]
negl %r12d #392.27
incl %r14d #382.13
addl $3, %r12d #392.27
cmpl %r13d, %r14d #382.13
jb ..B5.15 # Prob 82% #382.13
# LOE rdi r10 r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5
# Sweep finished: write the residual sum back to its slot and restore %ebx.
..B5.36: # Preds ..B5.35
# Execution count [3.77e+00]
vmovsd %xmm6, 328(%rsp) #[spill]
movl 368(%rsp), %ebx #[spill]
# LOE ebx r13d
# End of one pass: the pass's starting parity flips (%ebx = 3 - %ebx). Then the
# factor stored at 360(%rsp) is updated. 384(%rsp) holds the pre-incremented
# iteration counter, so the value 1 identifies the first iteration.
..B5.37: # Preds ..B5.36 ..B5.13
# Execution count [4.19e+00]
negl %ebx #394.25
addl $3, %ebx #394.25
cmpl $1, 384(%rsp) #395.28[spill]
jne ..B5.40 # Prob 50% #395.28
# LOE ebx r13d
..B5.38: # Preds ..B5.37
# Execution count [2.09e+00]
movb 392(%rsp), %al #395.41[spill]
testb %al, %al #395.41
jne ..B5.40 # Prob 50% #395.41
# LOE ebx r13d
# First iteration and pass counter == 0: use the precomputed value at 40(%rsp).
..B5.39: # Preds ..B5.38
# Execution count [1.05e+00]
vmovsd 40(%rsp), %xmm0 #395.13[spill]
vmovsd %xmm0, 360(%rsp) #395.13[spill]
jmp ..B5.41 # Prob 100% #395.13
# LOE ebx r13d
# Otherwise: new = c9 / (c9 - old * 312(%rsp)), with c9 = .L_2il0floatpacket.9 and
# "old" the current content of 360(%rsp).
..B5.40: # Preds ..B5.37 ..B5.38
# Execution count [3.14e+00]
vmovsd .L_2il0floatpacket.9(%rip), %xmm0 #395.13
vmovsd 360(%rsp), %xmm1 #395.13[spill]
vfnmadd132sd 312(%rsp), %xmm0, %xmm1 #395.13[spill]
vdivsd %xmm1, %xmm0, %xmm2 #396.77
vmovsd %xmm2, 360(%rsp) #396.77[spill]
# LOE ebx r13d
# Increment the pass counter byte and run a second pass while it is < 2.
..B5.41: # Preds ..B5.40 ..B5.39
# Execution count [4.19e+00]
movb 392(%rsp), %al #378.9[spill]
incb %al #378.9
movb %al, 392(%rsp) #378.9[spill]
cmpb $2, %al #378.9
jb ..B5.5 # Prob 50% #378.9
# LOE ebx r13d
# Both passes done: reload everything spilled before the pass loop.
#   %ecx = n, %rdx = p, %r9 = p + 8*n, %r10d = n >> 1, xmm0 = residual sum,
#   %rax = p + 8*(n+2)*m, %r14 = p + 8*((n+2)*m + n)   (m = %r13d)
# Then copy boundary rows (source lines 400-401); skipped when n <= 0:
#   p[i]               = p[(n+2) + i]
#   p[(n+2)*(m+1) + i] = p[(n+2)*m + i]        for i = 1 .. n
..B5.42: # Preds ..B5.41
# Execution count [2.09e+00]
movl 400(%rsp), %ecx #[spill]
vmovsd 328(%rsp), %xmm0 #[spill]
vmovsd 304(%rsp), %xmm3 #[spill]
vmovsd 296(%rsp), %xmm1 #[spill]
movq 248(%rsp), %rax #[spill]
movq 256(%rsp), %r14 #[spill]
movl 264(%rsp), %r10d #[spill]
movq 272(%rsp), %r9 #[spill]
movq 280(%rsp), %r8 #[spill]
movl 288(%rsp), %edi #[spill]
movl 384(%rsp), %r11d #[spill]
movq 408(%rsp), %rdx #[spill]
movl 240(%rsp), %r12d #[spill]
testl %ecx, %ecx #399.36
jle ..B5.49 # Prob 50% #399.36
# LOE rax rdx r8 r9 r14 ecx edi r10d r11d r12d r13d xmm0 xmm1 xmm3
# %esi = 1 is the index used by the remainder step if the 2x-unrolled loop is
# skipped (n >> 1 == 0).
..B5.43: # Preds ..B5.42
# Execution count [2.09e+00]
movl $1, %esi #399.9
xorl %ebx, %ebx #399.9
testl %r10d, %r10d #399.9
je ..B5.47 # Prob 10% #399.9
# LOE rax rdx r8 r9 r14 ecx ebx esi edi r10d r11d r12d r13d xmm0 xmm1 xmm3
# Free %r11d/%r12d/%r13d/%ecx for the loop; %r12d = (n+2)*m, %r11d = (n+2)*m + n.
..B5.44: # Preds ..B5.43
# Execution count [1.88e+00]
movl %r11d, 384(%rsp) #[spill]
movl %r12d, 240(%rsp) #[spill]
movl %r13d, 424(%rsp) #[spill]
movl %ecx, 400(%rsp) #[spill]
movl 192(%rsp), %r12d #[spill]
movl 200(%rsp), %r11d #[spill]
.align 16,0x90
# LOE rax rdx r8 r9 r14 ebx edi r10d r11d r12d xmm0 xmm1 xmm3
# Unrolled by two: pass k (%ebx) handles i = 2k+1 and i = 2k+2 for both rows.
..B5.45: # Preds ..B5.45 ..B5.44
# Execution count [5.23e+00]
movslq %ebx, %r13 #400.35
lea (%r12,%rbx,2), %ecx #356.19
shlq $4, %r13 #400.35
lea (%r11,%rbx,2), %esi #356.19
movslq %ecx, %rcx #401.35
incl %ebx #399.9
movslq %esi, %rsi #401.13
movq 24(%r9,%r13), %r15 #400.35
movq %r15, 8(%rdx,%r13) #400.13
movq 8(%rdx,%rcx,8), %r15 #401.35
movq %r15, 24(%rdx,%rsi,8) #401.13
movq 32(%r9,%r13), %r15 #400.35
movq %r15, 16(%rdx,%r13) #400.13
movq 16(%rdx,%rcx,8), %r13 #401.35
movq %r13, 32(%rdx,%rsi,8) #401.13
cmpl %r10d, %ebx #399.9
jb ..B5.45 # Prob 64% #399.9
# LOE rax rdx r8 r9 r14 ebx edi r10d r11d r12d xmm0 xmm1 xmm3
# Restore the scratch registers; %esi = 2*%ebx + 1 = next unprocessed i.
..B5.46: # Preds ..B5.45
# Execution count [1.88e+00]
movl 384(%rsp), %r11d #[spill]
lea 1(%rbx,%rbx), %esi #400.13
movl 240(%rsp), %r12d #[spill]
movl 424(%rsp), %r13d #[spill]
movl 400(%rsp), %ecx #[spill]
# LOE rax rdx r8 r9 r14 ecx esi edi r10d r11d r12d r13d xmm0 xmm1 xmm3
# Remainder: one more column is pending only when i - 1 < n (i.e. n is odd).
..B5.47: # Preds ..B5.46 ..B5.43
# Execution count [2.09e+00]
lea -1(%rsi), %ebx #399.9
cmpl %ecx, %ebx #399.9
jae ..B5.49 # Prob 10% #399.9
# LOE rax rdx r8 r9 r14 ecx esi edi r10d r11d r12d r13d xmm0 xmm1 xmm3
..B5.48: # Preds ..B5.47
# Execution count [1.88e+00]
movslq %esi, %rsi #400.35
movq 16(%r9,%rsi,8), %rbx #400.35
movq %rbx, (%rdx,%rsi,8) #400.13
movq (%rax,%rsi,8), %r15 #401.35
movq %r15, 16(%r14,%rsi,8) #401.13
# LOE rax rdx r8 r9 r14 ecx edi r10d r11d r12d r13d xmm0 xmm1 xmm3
# Copy boundary columns (source lines 405-406); skipped when m = %r13d <= 0.
# With n = %ecx and p = %rdx:
#   p[(n+2)*j]         = p[(n+2)*j + 1]
#   p[(n+2)*j + n + 1] = p[(n+2)*j + n]        for j = 1 .. m
..B5.49: # Preds ..B5.42 ..B5.47 ..B5.48
# Execution count [2.09e+00]
testl %r13d, %r13d #404.41
jle ..B5.56 # Prob 50% #404.41
# LOE rax rdx r8 r9 r14 ecx edi r10d r11d r12d r13d xmm0 xmm1 xmm3
# %edi = m >> 1 is the trip count of the 2x-unrolled loop; %r15d = 1 is the row used
# by the remainder step when that loop is skipped.
..B5.50: # Preds ..B5.49
# Execution count [2.09e+00]
xorl %ebx, %ebx #404.9
movl $1, %r15d #404.9
xorl %esi, %esi #405.13
testl %edi, %edi #404.9
je ..B5.54 # Prob 10% #404.9
# LOE rax rdx r8 r9 r14 ecx ebx esi edi r10d r11d r12d r13d r15d xmm0 xmm1 xmm3
# Free %r11d/%r12d/%r13d for the loop; %r13d = 2*n + 4 (two row strides),
# %r12d = 3*n.
..B5.51: # Preds ..B5.50
# Execution count [1.88e+00]
movl %r12d, 240(%rsp) #[spill]
movl %r13d, 424(%rsp) #[spill]
movl %r11d, 384(%rsp) #[spill]
movl 48(%rsp), %r13d #[spill]
movl 56(%rsp), %r12d #[spill]
.align 16,0x90
# LOE rax rdx r8 r9 r14 ecx ebx esi edi r10d r12d r13d xmm0 xmm1 xmm3
# Unrolled by two: %esi = (n+2)*(j-1) for the first of the two rows handled per
# pass, and advances by 2*(n+2).
..B5.52: # Preds ..B5.52 ..B5.51
# Execution count [5.23e+00]
movl %esi, %r15d #405.30
incl %ebx #404.9
subl %ecx, %r15d #405.30
lea (%r15,%rcx,2), %r11d #405.30
movslq %r11d, %r11 #405.30
movq 24(%rdx,%r11,8), %r15 #405.30
movq %r15, 16(%rdx,%r11,8) #405.13
lea (%rsi,%rcx,2), %r11d #406.30
movslq %r11d, %r11 #406.30
movq 16(%rdx,%r11,8), %r15 #406.30
movq %r15, 24(%rdx,%r11,8) #406.13
movq 40(%rdx,%r11,8), %r15 #405.30
movq %r15, 32(%rdx,%r11,8) #405.13
lea (%r12,%rsi), %r11d #387.67
movslq %r11d, %r11 #406.30
addl %r13d, %esi #404.9
movq 32(%rdx,%r11,8), %r15 #406.30
movq %r15, 40(%rdx,%r11,8) #406.13
cmpl %edi, %ebx #404.9
jb ..B5.52 # Prob 64% #404.9
# LOE rax rdx r8 r9 r14 ecx ebx esi edi r10d r12d r13d xmm0 xmm1 xmm3
# Restore the scratch registers; %r15d = 2*%ebx + 1 = next unprocessed row j.
..B5.53: # Preds ..B5.52
# Execution count [1.88e+00]
movl 384(%rsp), %r11d #[spill]
lea 1(%rbx,%rbx), %r15d #405.13
movl 240(%rsp), %r12d #[spill]
movl 424(%rsp), %r13d #[spill]
# LOE rax rdx r8 r9 r14 ecx edi r10d r11d r12d r13d r15d xmm0 xmm1 xmm3
# Remainder: one more row is pending only when j - 1 < m (i.e. m is odd).
..B5.54: # Preds ..B5.53 ..B5.50
# Execution count [2.09e+00]
lea -1(%r15), %ebx #404.9
cmpl %r13d, %ebx #404.9
jae ..B5.56 # Prob 10% #404.9
# LOE rax rdx r8 r9 r14 ecx edi r10d r11d r12d r13d r15d xmm0 xmm1 xmm3
# %r15d = j*(n+2) - n; combined with %r9 = p + 8*n and %r8 = p + 16*n this addresses
# p[(n+2)*j] / p[(n+2)*j + 1] and p[(n+2)*j + n] / p[(n+2)*j + n + 1].
..B5.55: # Preds ..B5.54
# Execution count [1.88e+00]
imull 208(%rsp), %r15d #405.30[spill]
addl 216(%rsp), %r15d #405.30[spill]
movslq %r15d, %r15 #405.30
movq 8(%r9,%r15,8), %rbx #405.30
movq %rbx, (%r9,%r15,8) #405.13
movq (%r8,%r15,8), %rsi #406.30
movq %rsi, 8(%r8,%r15,8) #406.13
# LOE rax rdx r8 r9 r14 ecx edi r10d r11d r12d r13d xmm0 xmm1 xmm3
# End of one outer iteration: xmm2 = residual sum (xmm0) / xmm3, where xmm3 is the
# double-converted product of Solver offsets 24 and 28. %ebx takes the iteration
# count. Loop again while xmm2 >= xmm1 (the squared tolerance computed at entry).
..B5.56: # Preds ..B5.49 ..B5.54 ..B5.55
# Execution count [2.09e+00]
vdivsd %xmm3, %xmm0, %xmm2 #409.37
movl %r11d, %ebx #413.9
vcomisd %xmm1, %xmm2 #374.20
jae ..B5.3 # Prob 82% #374.20
# LOE rax rdx r8 r9 r14 ecx ebx edi r10d r11d r12d r13d xmm1 xmm2 xmm3
# Loop exit: reload the factor kept at 360(%rsp) as the first printf's FP argument.
..B5.57: # Preds ..B5.3 ..B5.56
# Execution count [3.77e-01]
vmovsd 360(%rsp), %xmm0 #[spill]
# LOE ebx xmm0 xmm2
# printf(.L_2__STRING.7, xmm0). %eax = 1 tells the variadic callee that one vector
# register carries an argument; xmm2 is spilled because xmm registers are
# caller-saved. The format strings are defined outside this chunk.
# NOTE(review): "movl $sym, %edi" is a 32-bit absolute address, so this object is
# not position-independent as generated.
..B5.58: # Preds ..B5.57 ..B5.1
# Execution count [1.00e+00]
movl $.L_2__STRING.7, %edi #416.5
movl $1, %eax #416.5
vzeroupper #416.5
vmovsd %xmm2, (%rsp) #416.5[spill]
..___tag_value_solveRBA.541:
# printf(const char *__restrict__, ...)
call printf #416.5
..___tag_value_solveRBA.542:
# LOE ebx
# printf(.L_2__STRING.8, %ebx, sqrt(xmm2)): iteration count and the square root of
# the last normalised residual.
..B5.59: # Preds ..B5.58
# Execution count [1.00e+00]
vmovsd (%rsp), %xmm2 #[spill]
movl $.L_2__STRING.8, %edi #417.5
vsqrtsd %xmm2, %xmm2, %xmm2 #417.5
movl %ebx, %esi #417.5
movl $1, %eax #417.5
vmovapd %xmm2, %xmm0 #417.5
..___tag_value_solveRBA.545:
# printf(const char *__restrict__, ...)
call printf #417.5
..___tag_value_solveRBA.546:
# LOE
# Epilogue: release the 472-byte local area, pop the callee-saved registers in
# reverse push order, then restore %rsp from the frame pointer (undoing the 64-byte
# realignment) and return.
..B5.60: # Preds ..B5.59
# Execution count [1.00e+00]
addq $472, %rsp #418.1
.cfi_restore 3
popq %rbx #418.1
.cfi_restore 15
popq %r15 #418.1
.cfi_restore 14
popq %r14 #418.1
.cfi_restore 13
popq %r13 #418.1
.cfi_restore 12
popq %r12 #418.1
movq %rbp, %rsp #418.1
popq %rbp #418.1
.cfi_def_cfa 7, 8
.cfi_restore 6
ret #418.1
# The CFI state is re-established here for the out-of-line block that follows the
# return instruction.
.cfi_def_cfa 6, 16
.cfi_escape 0x10, 0x03, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xd8, 0xff, 0xff, 0xff, 0x22
.cfi_offset 6, -16
.cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf0, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0f, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x22
# LOE
# Infrequent path from ..B5.22: fewer than 16 column steps in the row, so the
# unrolled vector loop is skipped and the masked remainder starts at step 0.
..B5.61: # Preds ..B5.22
# Execution count [9.42e-01]: Infreq
xorl %eax, %eax #383.17
jmp ..B5.26 # Prob 100% #383.17
.align 16,0x90
# LOE rdi r10 eax esi r8d r9d r12d r13d r14d xmm6 xmm7 xmm9 xmm11 xmm13 ymm8 ymm12 zmm0 zmm1 zmm2 zmm3 zmm4 zmm5 zmm10 zmm14
.cfi_endproc
# mark_end;
.type solveRBA,@function
.size solveRBA,.-solveRBA
..LNsolveRBA.4:
.data
# -- End solveRBA
.text
.L_2__routine_start_writeResult_5:
# -- Begin writeResult
.text
# mark_begin;
.align 16,0x90
.globl writeResult
# --- writeResult(Solver *, double *, char *)
#
# Purpose:
#   Opens the file named by parameter 3 with mode string .L_2__STRING.9 ("w"),
#   then writes (28(%rdi) + 2) rows of (24(%rdi) + 2) doubles each from the
#   array in parameter 2.  Every value is printed with fprintf using the
#   format .L_2__STRING.11 ("%f "), every row is terminated with fputc('\n'),
#   and the file is finally closed with a tail call to fclose.
#   If fopen returns NULL the routine prints "Error!" through puts and
#   calls exit(1).
#   NOTE(review): offsets 24 and 28 of Solver are presumably imax and jmax;
#   confirm against the struct declaration.
#
# ABI: System V AMD64.
#   In:  rdi = Solver *, rsi = double * (array to dump), rdx = char * (file name)
#   Out: none in this routine; control leaves through `jmp fclose`
#   Stack: 3 pushes + 64 bytes of locals; rsp stays 16-byte aligned at calls.
#
# Register roles inside the row/column loops:
#   r13  = FILE * returned by fopen
#   rbx  = array base (outer loop) / pointer to current row (inner loop)
#   r12d = element offset of the current row within the array
#   r15d = row counter (outer loop) / 64-bit row width bound (inner loop)
#   r14d = row width, 24(%rdi) + 2
#   ebp  = 24(%rdi) (outer loop) / column counter as rbp (inner loop)
#
# Static data is addressed RIP-relative (lea sym(%rip)) instead of through
# 32-bit absolute immediates, so this routine carries no R_X86_64_32
# relocations and can be linked into position-independent executables.
writeResult:
# parameter 1: %rdi
# parameter 2: %rsi
# parameter 3: %rdx
..B6.1: # Preds ..B6.0
# Execution count [1.00e+00]
.cfi_startproc
..___tag_value_writeResult.562:
..L563:
#421.1
pushq %r15 #421.1
.cfi_def_cfa_offset 16
.cfi_offset 15, -16
pushq %rbx #421.1
.cfi_def_cfa_offset 24
.cfi_offset 3, -24
pushq %rbp #421.1
.cfi_def_cfa_offset 32
.cfi_offset 6, -32
subq $64, %rsp #421.1
.cfi_def_cfa_offset 96
movq %rsi, %r15 #421.1
movl 24(%rdi), %ebp #422.17
# rsi = address of the fopen mode string "w" (RIP-relative, PIE-safe)
lea .L_2__STRING.9(%rip), %rsi #427.10
movl 28(%rdi), %ebx #423.17
movq %rdx, %rdi #427.10
# fopen(const char *__restrict__, const char *__restrict__)
call fopen #427.10
# LOE rax r12 r13 r14 r15 ebx ebp
..B6.19: # Preds ..B6.1
# Execution count [1.00e+00]
movq %rax, %rdi #427.10
# LOE rdi r12 r13 r14 r15 ebx ebp
..B6.2: # Preds ..B6.19
# Execution count [1.00e+00]
# NULL stream -> error path at ..B6.15
testq %rdi, %rdi #429.15
je ..B6.15 # Prob 0% #429.15
# LOE rdi r12 r13 r14 r15 ebx ebp
..B6.3: # Preds ..B6.2
# Execution count [9.93e-01]
# ebx = row count; with no rows to write go straight to fclose (rdi = stream)
addl $2, %ebx #434.32
xorl %ecx, %ecx #434.16
testl %ebx, %ebx #434.32
jle ..B6.13 # Prob 10% #434.32
# LOE rdi r12 r13 r14 r15 ecx ebx ebp
..B6.4: # Preds ..B6.3
# Execution count [8.94e-01]
# Loop set-up: callee-saved r12/r13/r14 are saved in stack slots 0/8/16,
# the 64-bit row width goes to 48(%rsp) and the row count to 56(%rsp).
movslq %ebp, %rsi #435.9
lea 2(%rbp), %edx #435.36
addq $2, %rsi #435.36
movq %rsi, 48(%rsp) #434.16[spill]
movl %ebx, 56(%rsp) #434.16[spill]
movq %r15, %rbx #434.16
movq %r12, (%rsp) #434.16[spill]
.cfi_offset 12, -96
movl %ecx, %r12d #434.16
movq %r13, 8(%rsp) #434.16[spill]
.cfi_offset 13, -88
movl %ecx, %r15d #434.16
movq %r14, 16(%rsp) #434.16[spill]
.cfi_offset 14, -80
movl %edx, %r14d #434.16
movq %rdi, %r13 #434.16
# LOE rbx r13 ebp r12d r14d r15d
..B6.5: # Preds ..B6.11 ..B6.4
# Execution count [4.96e+00]
# Outer loop head: skip the column loop when the row width is not positive
xorl %edx, %edx #435.20
testl %r14d, %r14d #435.36
jle ..B6.10 # Prob 10% #435.36
# LOE rdx rbx r13 ebp r12d r14d r15d
..B6.6: # Preds ..B6.5
# Execution count [4.47e+00]
# Park the outer-loop state and form rbx = &array[row offset]
movslq %r12d, %r12 #436.32
movl %r15d, 40(%rsp) #436.32[spill]
movl %ebp, 32(%rsp) #436.32[spill]
movq %rdx, %rbp #436.32
movq %rbx, 24(%rsp) #436.32[spill]
movq 48(%rsp), %r15 #436.32[spill]
lea (%rbx,%r12,8), %rax #436.32
movq %rax, %rbx #436.32
# LOE rbx rbp r13 r15 r12d r14d
..B6.7: # Preds ..B6.8 ..B6.6
# Execution count [2.48e+01]
# fprintf(stream, "%f ", row[column]); al = 1 vector register argument
vmovsd (%rbx,%rbp,8), %xmm0 #436.13
movq %r13, %rdi #436.13
lea .L_2__STRING.11(%rip), %rsi #436.13
movl $1, %eax #436.13
# fprintf(FILE *__restrict__, const char *__restrict__, ...)
call fprintf #436.13
# LOE rbx rbp r13 r15 r12d r14d
..B6.8: # Preds ..B6.7
# Execution count [2.48e+01]
incq %rbp #435.39
cmpq %r15, %rbp #435.36
jl ..B6.7 # Prob 82% #435.36
# LOE rbx rbp r13 r15 r12d r14d
..B6.9: # Preds ..B6.8
# Execution count [4.47e+00]
# Restore the outer-loop state parked in ..B6.6
movl 40(%rsp), %r15d #[spill]
movl 32(%rsp), %ebp #[spill]
movq 24(%rsp), %rbx #[spill]
# LOE rbx r13 ebp r12d r14d r15d
..B6.10: # Preds ..B6.9 ..B6.5
# Execution count [4.96e+00]
# End of row: fputc('\n', stream)
movl $10, %edi #438.9
movq %r13, %rsi #438.9
call fputc #438.9
# LOE rbx r13 ebp r12d r14d r15d
..B6.11: # Preds ..B6.10
# Execution count [4.96e+00]
# Next row: advance the element offset by the row width (ebp + 2)
incl %r15d #434.35
lea 2(%r12,%rbp), %r12d #434.35
cmpl 56(%rsp), %r15d #434.32[spill]
jl ..B6.5 # Prob 82% #434.32
# LOE rbx r13 ebp r12d r14d r15d
..B6.12: # Preds ..B6.11
# Execution count [8.94e-01]
# Reload callee-saved registers; rdi = stream for the fclose tail call
movq (%rsp), %r12 #[spill]
.cfi_restore 12
movq %r13, %rdi #
movq 8(%rsp), %r13 #[spill]
.cfi_restore 13
movq 16(%rsp), %r14 #[spill]
.cfi_restore 14
# LOE rdi r12 r13 r14
..B6.13: # Preds ..B6.12 ..B6.3
# Execution count [9.93e-01]
# Epilogue followed by a tail call: fclose returns directly to our caller
addq $64, %rsp #441.5
.cfi_def_cfa_offset 32
.cfi_restore 6
popq %rbp #441.5
.cfi_def_cfa_offset 24
.cfi_restore 3
popq %rbx #441.5
.cfi_def_cfa_offset 16
.cfi_restore 15
popq %r15 #441.5
.cfi_def_cfa_offset 8
# fclose(FILE *)
jmp fclose #441.5
.cfi_def_cfa_offset 96
.cfi_offset 3, -24
.cfi_offset 6, -32
.cfi_offset 15, -16
# LOE
..B6.15: # Preds ..B6.2
# Execution count [7.13e-03]: Infreq
# fopen failed: puts("Error!") then exit(1); control does not come back
lea il0_peep_printf_format_1(%rip), %rdi #430.9
call puts #430.9
# LOE
..B6.16: # Preds ..B6.15
# Execution count [7.13e-03]: Infreq
movl $1, %edi #431.9
# exit(int)
call exit #431.9
.align 16,0x90
# LOE
.cfi_endproc
# mark_end;
.type writeResult,@function
.size writeResult,.-writeResult
..LNwriteResult.5:
.section .rodata.str1.4, "aMS",@progbits,1
.space 1, 0x00 # pad
.align 4
# NUL-terminated string "Error!" (bytes 45 72 72 6f 72 21 00)
il0_peep_printf_format_1:
.long 1869771333
.word 8562
.byte 0
.data
# -- End writeResult
.text
.L_2__routine_start_initSolver_6:
# -- Begin initSolver
.text
# mark_begin;
.align 16,0x90
.globl initSolver
# --- initSolver(Solver *, Parameter *, int)
#
# Purpose:
#   Fills in the Solver structure from the Parameter structure, allocates two
#   double arrays through allocate(64, bytes) and initialises them:
#     * array at 48(solver): element (i, row) = sin(i * 4*pi * 0(solver))
#                                             + sin(4*pi * y), where
#       y = 16(solver) + row * 8(solver); rows = 32(solver) + 2.
#     * array at 56(solver): if parameter 3 == 2, element (i, row) =
#       sin(i * 2*pi * 0(solver)); otherwise every element is 0.0;
#       rows = 28(solver) + 2.
#   Both arrays use rows of 24(solver) + 2 doubles.
#   NOTE(review): the offsets presumably map to dx(0), dy(8), ys(16),
#   imax(24), jmax(28), jmaxLocal(32), rank(36), size(40), p(48), rhs(56),
#   eps(64), omega(72), itermax(88); confirm against the Solver declaration.
#
# ABI: System V AMD64.
#   In:  rdi = Solver *, rsi = Parameter *, edx = int (problem selector)
#   Out: none
#   Frame: rbp-based, rsp realigned to 64 bytes, 5 pushes + 408 bytes locals.
#
# Main stack slots (first loop nest / else-branch; the "== 2" branch reuses
# 24(%rsp) and 32(%rsp) for its own row stride and row bound):
#   (%rsp)    row width rounded down to a multiple of 8
#   8(%rsp)   28(solver)                 16(%rsp)  0(solver) as double
#   24(%rsp)  parameter 3                32(%rsp)  28(solver) + 2
#   40(%rsp)  24(solver)                 48(%rsp)  pointer stored at 56(solver)
#   128(%rsp) 8 lanes of 4*pi * 0(solver)
#   264(%rsp) row bound  272(%rsp) row stride in bytes  280(%rsp) 24(solver)
#   288(%rsp) row index  296(%rsp) solver  304(%rsp) 8(solver) as double
#   312(%rsp) pointer to current row     352(%rsp) y of the current row
#
# The printf format address is formed RIP-relative (lea sym(%rip)) rather
# than with a 32-bit absolute immediate, so the routine carries no
# R_X86_64_32 relocation and can be linked position-independent.
initSolver:
# parameter 1: %rdi
# parameter 2: %rsi
# parameter 3: %edx
..B7.1: # Preds ..B7.0
# Execution count [1.00e+00]
.cfi_startproc
..___tag_value_initSolver.604:
..L605:
#110.1
pushq %rbp #110.1
.cfi_def_cfa_offset 16
movq %rsp, %rbp #110.1
.cfi_def_cfa 6, 16
.cfi_offset 6, -16
andq $-64, %rsp #110.1
pushq %r12 #110.1
pushq %r13 #110.1
pushq %r14 #110.1
pushq %r15 #110.1
pushq %rbx #110.1
subq $408, %rsp #110.1
.cfi_escape 0x10, 0x03, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xd8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf0, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0f, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x22
# r15 = solver, rbx = params, parameter 3 parked in 24(%rsp).
# 1140850688 (0x44000000) is the MPI_Comm handle passed to both MPI calls
# (presumably MPI_COMM_WORLD; confirm against the MPI headers in use).
movq %rdi, %r15 #110.1
movq %rsi, %rbx #110.1
movl $1140850688, %edi #111.5
movl %edx, 24(%rsp) #110.1[spill]
lea 36(%r15), %rsi #111.5
..___tag_value_initSolver.615:
# MPI_Comm_rank(MPI_Comm, int *)
call MPI_Comm_rank #111.5
..___tag_value_initSolver.616:
# LOE rbx r15
..B7.2: # Preds ..B7.1
# Execution count [1.00e+00]
movl $1140850688, %edi #112.5
lea 40(%r15), %rsi #112.5
..___tag_value_initSolver.617:
# MPI_Comm_size(MPI_Comm, int *)
call MPI_Comm_size #112.5
..___tag_value_initSolver.618:
# LOE rbx r15
..B7.3: # Preds ..B7.2
# Execution count [1.00e+00]
# 28(solver) = 20(params); 24(solver) = 16(params);
# 32(solver) = 20(params) / 40(solver) + (20(params) % 40(solver) > 36(solver));
# printf(.L_2__STRING.5, 36(solver), 24(solver), 32(solver)) with al = 0.
movl 20(%rbx), %eax #114.25
xorl %ecx, %ecx #115.5
movl %eax, 28(%r15) #114.5
# rdi = printf format address (RIP-relative; lea leaves eax and flags alone)
lea .L_2__STRING.5(%rip), %rdi #116.5
cltd #115.25
idivl 40(%r15) #115.25
movl 36(%r15), %esi #115.36
cmpl %esi, %edx #115.5
movl 16(%rbx), %r8d #113.25
movl %r8d, %edx #116.5
setg %cl #115.5
addl %eax, %ecx #115.25
xorl %eax, %eax #116.5
movl %ecx, 32(%r15) #115.5
movl %r8d, 24(%r15) #113.5
..___tag_value_initSolver.619:
# printf(const char *__restrict__, ...)
call printf #116.5
..___tag_value_initSolver.620:
# LOE rbx r15
..B7.4: # Preds ..B7.3
# Execution count [1.00e+00]
# 0(solver)  = 0(params) / (double)16(params)
# 8(solver)  = 8(params) / (double)20(params)
# 16(solver) = 8(solver) * (double)(36(solver) * 32(solver))
# 64/72/88(solver) copied from 32/40/24(params)
# First allocation: allocate(64, (24(solver)+2) * (32(solver)+2) * 8)
vxorpd %xmm4, %xmm4, %xmm4 #122.41
vxorpd %xmm1, %xmm1, %xmm1 #121.41
vcvtsi2sd 20(%rbx), %xmm4, %xmm4 #122.41
vcvtsi2sd 16(%rbx), %xmm1, %xmm1 #121.41
vmovsd 8(%rbx), %xmm3 #122.23
vxorpd %xmm6, %xmm6, %xmm6 #123.38
vdivsd %xmm4, %xmm3, %xmm5 #122.41
vmovsd (%rbx), %xmm0 #121.23
movl $64, %edi #131.21
vdivsd %xmm1, %xmm0, %xmm2 #121.41
movl 32(%r15), %r12d #123.38
movl 36(%r15), %r14d #123.23
imull %r12d, %r14d #123.38
vmovsd %xmm2, (%r15) #121.5
vmovsd %xmm5, 8(%r15) #122.5
movl 24(%r15), %edx #128.21
vcvtsi2sd %r14d, %xmm6, %xmm6 #123.38
movq 32(%rbx), %r13 #124.23
movq 40(%rbx), %rax #125.23
movl 24(%rbx), %ebx #126.23
movl %ebx, 88(%r15) #126.5
lea 2(%rdx), %ebx #131.42
movq %r13, 64(%r15) #124.5
lea 2(%r12), %r13d #131.60
movl %ebx, %esi #131.21
imull %r13d, %esi #131.21
vmulsd %xmm6, %xmm5, %xmm7 #123.58
movslq %esi, %rsi #131.21
shlq $3, %rsi #131.21
vmovsd %xmm7, 16(%r15) #123.5
movq %rax, 72(%r15) #125.5
movl %edx, 40(%rsp) #128.21[spill]
movl 28(%r15), %r14d #129.21
..___tag_value_initSolver.622:
# allocate(int, size_t)
call allocate #131.21
..___tag_value_initSolver.623:
# LOE rax r15 ebx r12d r13d r14d
..B7.5: # Preds ..B7.4
# Execution count [1.00e+00]
# 48(solver) = first array; second allocation:
# allocate(64, (24(solver)+2) * (28(solver)+2) * 8)
movq %rax, 48(%r15) #131.5
lea 2(%r14), %eax #132.55
movl %ebx, %esi #132.21
movl $64, %edi #132.21
imull %eax, %esi #132.21
movslq %esi, %rsi #132.21
shlq $3, %rsi #132.21
movl %eax, 32(%rsp) #132.55[spill]
..___tag_value_initSolver.624:
# allocate(int, size_t)
call allocate #132.21
..___tag_value_initSolver.625:
# LOE rax r15 ebx r12d r13d r14d
..B7.6: # Preds ..B7.5
# Execution count [1.00e+00]
# 56(solver) = second array.  Skip the first loop nest when the row
# count (32(solver) + 2, in r13d) is not positive.
movq %rax, 56(%r15) #132.5
xorl %r9d, %r9d #139.5
vmovsd (%r15), %xmm6 #134.19
vmovsd 8(%r15), %xmm5 #135.19
testl %r13d, %r13d #139.37
movq 48(%r15), %r13 #136.19
jle ..B7.27 # Prob 9% #139.37
# LOE rax r9 r13 r15 ebx r12d r14d xmm5 xmm6
..B7.7: # Preds ..B7.6
# Execution count [9.00e-01]
# Set-up of the first loop nest: broadcast 4*pi * 0(solver) into
# 128(%rsp) and park every loop-carried value in its stack slot.
vmovsd .L_2il0floatpacket.18(%rip), %xmm1 #142.27
movl %ebx, %r8d #141.9
vmulsd %xmm1, %xmm6, %xmm0 #142.38
andl $-8, %r8d #141.9
vmovdqu .L_2il0floatpacket.7(%rip), %ymm3 #141.9
vmovdqu .L_2il0floatpacket.6(%rip), %ymm2 #142.23
vbroadcastsd %xmm0, %zmm0 #142.38
vmovsd %xmm5, 304(%rsp) #139.5[spill]
vmovsd %xmm6, 16(%rsp) #139.5[spill]
movslq 40(%rsp), %rdi #142.13[spill]
movq %r13, %rcx #139.5
movslq %r12d, %rdx #139.5
xorl %r12d, %r12d #139.5
addq $2, %rdx #139.37
vmovups %zmm0, 128(%rsp) #139.5[spill]
lea 16(,%rdi,8), %rsi #142.13
movq %rcx, 312(%rsp) #139.5[spill]
movq %rdx, 264(%rsp) #139.5[spill]
movq %rsi, 272(%rsp) #139.5[spill]
movq %rdi, 280(%rsp) #139.5[spill]
movl %r8d, (%rsp) #139.5[spill]
movq %r9, 288(%rsp) #139.5[spill]
movq %rax, 48(%rsp) #139.5[spill]
movl %r14d, 8(%rsp) #139.5[spill]
movq %r15, 296(%rsp) #139.5[spill]
vpxord %zmm4, %zmm4, %zmm4 #142.23
# LOE r12 r13 ebx
..B7.8: # Preds ..B7.25 ..B7.7
# Execution count [5.00e+00]
# Row loop head: y = 8(solver) * row + 16(solver), kept in 352(%rsp).
# ebx = row width; an empty row goes straight to the row advance.
vxorpd %xmm1, %xmm1, %xmm1 #140.33
movq 288(%rsp), %rax #140.37[spill]
vcvtsi2sd %eax, %xmm1, %xmm1 #140.33
movq 296(%rsp), %rcx #140.37[spill]
vmovsd 304(%rsp), %xmm0 #140.37[spill]
vfmadd213sd 16(%rcx), %xmm0, %xmm1 #140.37
vmovsd %xmm1, 352(%rsp) #140.37[spill]
testl %ebx, %ebx #141.36
jle ..B7.25 # Prob 50% #141.36
# LOE r12 r13 ebx
..B7.9: # Preds ..B7.8
# Execution count [4.50e+00]
# Fewer than 8 columns: only the masked remainder block runs
cmpl $8, %ebx #141.9
jl ..B7.77 # Prob 10% #141.9
# LOE r12 r13 ebx
..B7.10: # Preds ..B7.9
# Execution count [4.50e+00]
# Fewer than 1001 columns: skip the alignment peel
cmpl $1001, %ebx #141.9
jl ..B7.76 # Prob 10% #141.9
# LOE r12 r13 ebx
..B7.11: # Preds ..B7.10
# Execution count [4.50e+00]
# Peel count r15d: number of doubles needed to bring the row pointer to a
# 64-byte boundary; 0 when the pointer is not 8-byte aligned or already
# 64-byte aligned; capped at the row width.
movq 312(%rsp), %r15 #141.9[spill]
andq $63, %r15 #141.9
testl $7, %r15d #141.9
je ..B7.13 # Prob 50% #141.9
# LOE r12 r13 ebx r15d
..B7.12: # Preds ..B7.11
# Execution count [2.25e+00]
xorl %r15d, %r15d #141.9
jmp ..B7.15 # Prob 100% #141.9
# LOE r12 r13 ebx r15d
..B7.13: # Preds ..B7.11
# Execution count [2.25e+00]
testl %r15d, %r15d #141.9
je ..B7.15 # Prob 50% #141.9
# LOE r12 r13 ebx r15d
..B7.14: # Preds ..B7.13
# Execution count [2.50e+01]
negl %r15d #141.9
addl $64, %r15d #141.9
shrl $3, %r15d #141.9
cmpl %r15d, %ebx #141.9
cmovl %ebx, %r15d #141.9
# LOE r12 r13 ebx r15d
..B7.15: # Preds ..B7.12 ..B7.14 ..B7.13
# Execution count [5.00e+00]
# r14d = end column of the unmasked loop = width - ((width - peel) & 7)
movl %ebx, %r14d #141.9
subl %r15d, %r14d #141.9
andl $7, %r14d #141.9
negl %r14d #141.9
addl %ebx, %r14d #141.9
cmpl $1, %r15d #141.9
jb ..B7.19 # Prob 50% #141.9
# LOE r12 r13 ebx r14d r15d
..B7.16: # Preds ..B7.15
# Execution count [4.50e+00]
# Peel loop set-up: lane indices and the peel count are spilled around the
# scalar sin(4*pi * y) call.
vmovdqu .L_2il0floatpacket.7(%rip), %ymm0 #141.9
vmovsd .L_2il0floatpacket.18(%rip), %xmm2 #142.48
vpbroadcastd %r15d, %ymm1 #141.9
vmovdqu %ymm0, 96(%rsp) #141.9[spill]
vmulsd 352(%rsp), %xmm2, %xmm0 #142.48[spill]
vmovdqu %ymm1, 64(%rsp) #141.9[spill]
movq $0, 256(%rsp) #141.9[spill]
vzeroupper #142.48
call sin #142.48
# LOE r12 r13 ebx r14d r15d xmm0
..B7.82: # Preds ..B7.16
# Execution count [4.50e+00]
# zmm16 = sin(4*pi * y) in all lanes; rbx becomes the column counter
# (row width is parked in 56(%rsp)); rdi = row pointer, rsi = peel count.
movl %ebx, 56(%rsp) #141.9[spill]
vbroadcastsd %xmm0, %zmm16 #142.48
vmovdqu32 64(%rsp), %ymm18 #141.9[spill]
vmovdqu32 96(%rsp), %ymm17 #141.9[spill]
vmovups 128(%rsp), %zmm19 #141.9[spill]
vmovdqu32 .L_2il0floatpacket.6(%rip), %ymm20 #141.9
movslq %r15d, %rsi #141.9
movq 256(%rsp), %rbx #141.9[spill]
movq 312(%rsp), %rdi #141.9[spill]
vpxord %zmm21, %zmm21, %zmm21 #141.9
# LOE rbx rsi rdi r12 r13 r14d r15d ymm17 ymm18 ymm20 zmm16 zmm19 zmm21
..B7.17: # Preds ..B7.83 ..B7.82
# Execution count [2.50e+01]
# Peel loop body: mask k4 selects lanes whose column index < peel count;
# masked 8-wide sine of column * 4*pi * 0(solver).
vpcmpgtd %ymm17, %ymm18, %k4 #141.9
vmovaps %zmm21, %zmm0 #142.23
kmovw %k4, %k1 #142.23
vcvtdq2pd %ymm17, %zmm2 #142.38
vmulpd %zmm2, %zmm19, %zmm1 #142.42
..___tag_value_initSolver.655:
call *__svml_sin8_mask_z0@GOTPCREL(%rip) #142.23
..___tag_value_initSolver.656:
# LOE rbx rsi rdi r12 r13 r14d r15d ymm17 ymm18 ymm20 zmm0 zmm16 zmm19 zmm21 k4
..B7.83: # Preds ..B7.17
# Execution count [2.50e+01]
vpaddd %ymm20, %ymm17, %ymm17 #141.9
vaddpd %zmm0, %zmm16, %zmm1 #142.48
vmovupd %zmm1, (%rdi,%rbx,8){%k4} #142.13
addq $8, %rbx #141.9
cmpq %rsi, %rbx #141.9
jb ..B7.17 # Prob 82% #141.9
# LOE rbx rsi rdi r12 r13 r14d r15d ymm17 ymm18 ymm20 zmm16 zmm19 zmm21
..B7.18: # Preds ..B7.83
# Execution count [4.50e+00]
# Row fully covered by the peel loop -> next row
movl 56(%rsp), %ebx #[spill]
cmpl %r15d, %ebx #141.9
je ..B7.25 # Prob 10% #141.9
# LOE r12 r13 ebx r14d r15d
..B7.19: # Preds ..B7.18 ..B7.15 ..B7.76
# Execution count [2.50e+01]
# Unmasked loop set-up: lane column indices start at r15d; skip the loop
# when fewer than 8 columns remain before r14d.
vpbroadcastd %r15d, %ymm0 #142.23
lea 8(%r15), %eax #141.9
vpaddd .L_2il0floatpacket.20(%rip), %ymm0, %ymm1 #142.23
vmovdqu %ymm1, 320(%rsp) #142.23[spill]
cmpl %eax, %r14d #141.9
jl ..B7.23 # Prob 50% #141.9
# LOE r12 r13 ebx r14d r15d
..B7.20: # Preds ..B7.19
# Execution count [4.50e+00]
vmovsd .L_2il0floatpacket.18(%rip), %xmm0 #142.48
vmulsd 352(%rsp), %xmm0, %xmm0 #142.48[spill]
movslq %r15d, %r15 #141.9
vzeroupper #142.48
call sin #142.48
# LOE r12 r13 r15 ebx r14d r15d xmm0
..B7.84: # Preds ..B7.20
# Execution count [4.50e+00]
vbroadcastsd %xmm0, %zmm16 #142.48
vmovdqu32 320(%rsp), %ymm17 #142.48[spill]
vmovups 128(%rsp), %zmm18 #142.48[spill]
vmovdqu32 .L_2il0floatpacket.6(%rip), %ymm19 #142.48
movq %r15, %rsi #142.48
movq 312(%rsp), %rdi #142.48[spill]
# LOE rsi rdi r12 r13 ebx r14d r15d ymm17 ymm19 zmm16 zmm18
..B7.21: # Preds ..B7.85 ..B7.84
# Execution count [2.50e+01]
# Unmasked loop body: 8 columns per iteration
vcvtdq2pd %ymm17, %zmm1 #142.38
vmulpd %zmm1, %zmm18, %zmm0 #142.42
..___tag_value_initSolver.663:
call *__svml_sin8_z0@GOTPCREL(%rip) #142.23
..___tag_value_initSolver.664:
# LOE rsi rdi r12 r13 ebx r14d r15d ymm17 ymm19 zmm0 zmm16 zmm18
..B7.85: # Preds ..B7.21
# Execution count [2.50e+01]
addl $8, %r15d #141.9
vpaddd %ymm19, %ymm17, %ymm17 #142.23
vaddpd %zmm0, %zmm16, %zmm1 #142.48
vmovupd %zmm1, (%rdi,%rsi,8) #142.13
addq $8, %rsi #141.9
cmpl %r14d, %r15d #141.9
jb ..B7.21 # Prob 82% #141.9
# LOE rsi rdi r12 r13 ebx r14d r15d ymm17 ymm19 zmm16 zmm18
..B7.23: # Preds ..B7.85 ..B7.19 ..B7.77
# Execution count [5.00e+00]
# Remainder: columns r14d .. width-1 (none when r14d + 1 > width)
lea 1(%r14), %eax #141.9
cmpl %ebx, %eax #141.9
ja ..B7.25 # Prob 50% #141.9
# LOE r12 r13 ebx r14d
..B7.24: # Preds ..B7.23
# Execution count [2.50e+01]
# Mask k1 selects lanes < (width - r14d); it is spilled to 360(%rsp)
# because two calls follow before the masked store.
vpbroadcastd %r14d, %ymm1 #142.23
movl %ebx, %eax #141.9
vpaddd .L_2il0floatpacket.20(%rip), %ymm1, %ymm2 #142.23
subl %r14d, %eax #141.9
vpbroadcastd %eax, %ymm4 #141.9
vpcmpgtd .L_2il0floatpacket.7(%rip), %ymm4, %k1 #141.9
kmovw %k1, 360(%rsp) #141.9[spill]
vcvtdq2pd %ymm2, %zmm3 #142.38
vmulpd 128(%rsp), %zmm3, %zmm1 #142.42[spill]
vpxord %zmm0, %zmm0, %zmm0 #142.23
..___tag_value_initSolver.667:
call *__svml_sin8_mask_z0@GOTPCREL(%rip) #142.23
..___tag_value_initSolver.668:
# LOE r12 r13 ebx r14d zmm0
..B7.87: # Preds ..B7.24
# Execution count [2.50e+01]
vmovups %zmm0, 192(%rsp) #142.23[spill]
vmovsd .L_2il0floatpacket.18(%rip), %xmm0 #142.48
vmulsd 352(%rsp), %xmm0, %xmm0 #142.48[spill]
vzeroupper #142.48
call sin #142.48
# LOE r12 r13 ebx r14d xmm0
..B7.86: # Preds ..B7.87
# Execution count [2.50e+01]
# Masked store at array base (r13) + (row element offset r12 + r14) * 8
vbroadcastsd %xmm0, %zmm1 #142.48
kmovw 360(%rsp), %k1 #142.13[spill]
vaddpd 192(%rsp), %zmm1, %zmm2 #142.48[spill]
movslq %r14d, %r14 #142.13
addq %r12, %r14 #142.13
vmovupd %zmm2, (%r13,%r14,8){%k1} #142.13
# LOE r12 r13 ebx
..B7.25: # Preds ..B7.18 ..B7.23 ..B7.8 ..B7.86
# Execution count [5.00e+00]
# Row advance: row index += 1, element offset r12 += 24(solver) + 2,
# row pointer += row stride; loop while index < row bound (unsigned).
movq 280(%rsp), %rax #139.5[spill]
movq 312(%rsp), %rcx #139.5[spill]
movq 288(%rsp), %rsi #139.5[spill]
incq %rsi #139.5
lea 2(%r12,%rax), %r12 #139.5
addq 272(%rsp), %rcx #139.5[spill]
movq %rcx, 312(%rsp) #139.5[spill]
movq %rsi, 288(%rsp) #139.5[spill]
cmpq 264(%rsp), %rsi #139.5[spill]
jb ..B7.8 # Prob 82% #139.5
# LOE r12 r13 ebx
..B7.26: # Preds ..B7.25
# Execution count [9.00e-01]
vmovsd 16(%rsp), %xmm6 #[spill]
movq 48(%rsp), %rax #[spill]
movl 8(%rsp), %r14d #[spill]
# LOE rax ebx r14d xmm6
..B7.27: # Preds ..B7.26 ..B7.6
# Execution count [1.00e+00]
# Second array: parameter 3 == 2 selects the sine initialisation at
# ..B7.48, anything else zero-fills.
cmpl $2, 24(%rsp) #146.20[spill]
je ..B7.48 # Prob 16% #146.20
# LOE rax ebx r14d xmm6
..B7.28: # Preds ..B7.27
# Execution count [8.40e-01]
# Zero fill; nothing to do when 28(solver) + 2 <= 0
xorl %edx, %edx #153.9
cmpl $0, 32(%rsp) #153.36[spill]
jle ..B7.45 # Prob 9% #153.36
# LOE rax rdx ebx r14d
..B7.29: # Preds ..B7.28
# Execution count [7.56e-01]
# r12 = row stride in bytes, r14 = row bound, r15 = row pointer,
# r13 = byte offset of the row, rbx = row index, edx = row width,
# esi/rcx = row width rounded down to a multiple of 8.
movslq 40(%rsp), %rcx #155.17[spill]
movl %ebx, %esi #154.13
movslq %r14d, %r14 #153.9
andl $-8, %esi #154.13
movq %rdx, %rdi #153.9
addq $2, %r14 #153.36
vmovdqu .L_2il0floatpacket.7(%rip), %ymm0 #154.13
lea 16(,%rcx,8), %r12 #155.17
movslq %esi, %rcx #154.13
xorl %r13d, %r13d #153.9
movq %rax, %r15 #153.9
movl %ebx, %edx #153.9
movq %rdi, %rbx #153.9
vpxord %zmm1, %zmm1, %zmm1 #155.29
# LOE rax rcx rbx r12 r13 r14 r15 edx esi ymm0 zmm1
..B7.30: # Preds ..B7.43 ..B7.29
# Execution count [7.56e-01]
testl %edx, %edx #154.40
jle ..B7.43 # Prob 50% #154.40
# LOE rax rcx rbx r12 r13 r14 r15 edx esi ymm0 zmm1
..B7.31: # Preds ..B7.30
# Execution count [0.00e+00]
# Rows wider than 12 doubles are cleared with the memset helper;
# narrower rows use the inline vector stores below.
cmpl $12, %edx #154.13
jle ..B7.37 # Prob 0% #154.13
# LOE rax rcx rbx r12 r13 r14 r15 edx esi ymm0 zmm1
..B7.32: # Preds ..B7.31
# Execution count [2.48e+00]
movq %rcx, (%rsp) #[spill]
movl %esi, 8(%rsp) #[spill]
movq %rax, 48(%rsp) #[spill]
movl %edx, 56(%rsp) #[spill]
# LOE rbx r12 r13 r14 r15
..B7.33: # Preds ..B7.35 ..B7.32
# Execution count [4.20e+00]
# __intel_skx_avx512_memset(row pointer, 0, row stride in bytes)
movq %r15, %rdi #154.13
xorl %esi, %esi #154.13
movq %r12, %rdx #154.13
vzeroupper #154.13
call __intel_skx_avx512_memset #154.13
# LOE rbx r12 r13 r14 r15
..B7.34: # Preds ..B7.33
# Execution count [4.20e+00]
incq %rbx #153.9
addq %r12, %r15 #153.9
addq %r12, %r13 #153.9
cmpq %r14, %rbx #153.9
jae ..B7.45 # Prob 18% #153.9
# LOE rbx r12 r13 r14 r15
..B7.35: # Preds ..B7.34
# Execution count [1.72e+00]
cmpl $12, 56(%rsp) #154.13[spill]
jg ..B7.33 # Prob 100% #154.13
# LOE rbx r12 r13 r14 r15
..B7.36: # Preds ..B7.35
# Execution count [0.00e+00]
vmovdqu .L_2il0floatpacket.7(%rip), %ymm0 #
movq (%rsp), %rcx #[spill]
movl 8(%rsp), %esi #[spill]
movq 48(%rsp), %rax #[spill]
movl 56(%rsp), %edx #[spill]
vpxord %zmm1, %zmm1, %zmm1 #
# LOE rax rcx rbx r12 r13 r14 r15 edx esi ymm0 zmm1
..B7.37: # Preds ..B7.36 ..B7.31
# Execution count [4.20e+00]
cmpl $8, %edx #154.13
jl ..B7.46 # Prob 10% #154.13
# LOE rax rcx rbx r12 r13 r14 r15 edx esi ymm0 zmm1
..B7.38: # Preds ..B7.37
# Execution count [4.20e+00]
movl %esi, %r8d #154.13
xorl %r9d, %r9d #154.13
# LOE rax rcx rbx r9 r12 r13 r14 r15 edx esi r8d ymm0 zmm1
..B7.39: # Preds ..B7.39 ..B7.38
# Execution count [2.33e+01]
# Store 8 zero doubles per iteration up to the rounded-down width
vmovupd %zmm1, (%r15,%r9,8) #155.17
addq $8, %r9 #154.13
cmpq %rcx, %r9 #154.13
jb ..B7.39 # Prob 81% #154.13
# LOE rax rcx rbx r9 r12 r13 r14 r15 edx esi r8d ymm0 zmm1
..B7.41: # Preds ..B7.39 ..B7.46
# Execution count [4.67e+00]
lea 1(%r8), %r9d #154.13
cmpl %edx, %r9d #154.13
ja ..B7.43 # Prob 50% #154.13
# LOE rax rcx rbx r12 r13 r14 r15 edx esi r8d ymm0 zmm1
..B7.42: # Preds ..B7.41
# Execution count [2.33e+01]
# Masked zero store for the remaining (width - r8d) columns
movl %edx, %r9d #154.13
subl %r8d, %r9d #154.13
vpbroadcastd %r9d, %ymm2 #154.13
vpcmpgtd %ymm0, %ymm2, %k1 #154.13
movslq %r8d, %r8 #155.17
lea (%rax,%r8,8), %r10 #132.21
vmovupd %zmm1, (%r10,%r13){%k1} #155.17
# LOE rax rcx rbx r12 r13 r14 r15 edx esi ymm0 zmm1
..B7.43: # Preds ..B7.30 ..B7.41 ..B7.42
# Execution count [0.00e+00]
incq %rbx #153.9
addq %r12, %r15 #153.9
addq %r12, %r13 #153.9
cmpq %r14, %rbx #153.9
jb ..B7.30 # Prob 82% #153.9
# LOE rax rcx rbx r12 r13 r14 r15 edx esi ymm0 zmm1
..B7.45: # Preds ..B7.74 ..B7.70 ..B7.34 ..B7.43 ..B7.28
# ..B7.48
# Execution count [1.00e+00]
# Common epilogue: clear upper vector state, unwind the frame, return
vzeroupper #159.1
addq $408, %rsp #159.1
.cfi_restore 3
popq %rbx #159.1
.cfi_restore 15
popq %r15 #159.1
.cfi_restore 14
popq %r14 #159.1
.cfi_restore 13
popq %r13 #159.1
.cfi_restore 12
popq %r12 #159.1
movq %rbp, %rsp #159.1
popq %rbp #159.1
.cfi_def_cfa 7, 8
.cfi_restore 6
ret #159.1
.cfi_def_cfa 6, 16
.cfi_escape 0x10, 0x03, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xd8, 0xff, 0xff, 0xff, 0x22
.cfi_offset 6, -16
.cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf0, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe8, 0xff, 0xff, 0xff, 0x22
.cfi_escape 0x10, 0x0f, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x22
# LOE
..B7.46: # Preds ..B7.37
# Execution count [4.20e-01]: Infreq
# Row narrower than 8: the masked store covers it from column 0
xorl %r8d, %r8d #154.13
jmp ..B7.41 # Prob 100% #154.13
# LOE rax rcx rbx r12 r13 r14 r15 edx esi r8d ymm0 zmm1
..B7.48: # Preds ..B7.27
# Execution count [1.60e-01]: Infreq
# Parameter 3 == 2: second array element (i, row) = sin(i * 2*pi * 0(solver))
xorl %esi, %esi #147.9
cmpl $0, 32(%rsp) #147.36[spill]
jle ..B7.45 # Prob 10% #147.36
# LOE rax rsi ebx r14d xmm6
..B7.49: # Preds ..B7.48
# Execution count [1.44e-01]: Infreq
# zmm16 = 8 lanes of 2*pi * 0(solver); ymm17 = lane indices 0..7;
# ymm19 = lane increment 8; r12 = row pointer, r14 = array base,
# r15 = row element offset, rsi = row index, r13 = 24(solver).
# 24(%rsp) and 32(%rsp) are reused for the row stride and row bound.
vmulsd .L_2il0floatpacket.19(%rip), %xmm6, %xmm1 #149.44
movl %ebx, %r8d #148.13
vmovdqu32 .L_2il0floatpacket.7(%rip), %ymm17 #148.13
vmovdqu32 .L_2il0floatpacket.6(%rip), %ymm19 #149.29
vbroadcastsd %xmm1, %zmm16 #149.44
movslq 40(%rsp), %r13 #149.17[spill]
andl $-8, %r8d #148.13
movslq %r14d, %r14 #147.9
xorl %r15d, %r15d #147.9
addq $2, %r14 #147.36
movq %rax, %r12 #147.9
movl %r8d, (%rsp) #147.9[spill]
lea 16(,%r13,8), %rdi #149.17
movq %rdi, 24(%rsp) #147.9[spill]
movq %r14, 32(%rsp) #147.9[spill]
movq %rax, %r14 #147.9
vpxord %zmm18, %zmm18, %zmm18 #149.29
# LOE rsi r12 r13 r14 r15 ebx ymm17 ymm19 zmm16 zmm18
..B7.50: # Preds ..B7.70 ..B7.49
# Execution count [7.41e-01]: Infreq
testl %ebx, %ebx #148.40
jle ..B7.70 # Prob 50% #148.40
# LOE rsi r12 r13 r14 r15 ebx ymm17 ymm19 zmm16 zmm18
..B7.51: # Preds ..B7.50
# Execution count [6.90e-01]: Infreq
cmpl $8, %ebx #148.13
jl ..B7.73 # Prob 10% #148.13
# LOE rsi r12 r13 r14 r15 ebx ymm17 ymm19 zmm16 zmm18
..B7.52: # Preds ..B7.51
# Execution count [6.61e-01]: Infreq
# Switch to the register assignment used by the peel path:
# rax = row index, rsi = row stride, r8 = row bound, rcx = 24(solver),
# edx = row width; the array base is parked in 48(%rsp).
movq %r14, 48(%rsp) #[spill]
movl %ebx, %edx #
movq 32(%rsp), %r8 #[spill]
movq %rsi, %rax #
movq 24(%rsp), %rsi #[spill]
movq %r13, %rcx #
# LOE rax rcx rsi r8 r12 r15 edx ymm17 ymm19 zmm16 zmm18
..B7.53: # Preds ..B7.74 ..B7.52
# Execution count [7.20e-01]: Infreq
# Fewer than 430 columns: skip the alignment peel
cmpl $430, %edx #148.13
jl ..B7.72 # Prob 10% #148.13
# LOE rax rcx rsi r8 r12 r15 edx ymm17 ymm19 zmm16 zmm18
..B7.54: # Preds ..B7.53
# Execution count [7.20e-01]: Infreq
# Peel count r13d, computed from the row pointer as in ..B7.11-..B7.14
movq %r12, %r13 #148.13
andq $63, %r13 #148.13
testl $7, %r13d #148.13
je ..B7.56 # Prob 50% #148.13
# LOE rax rcx rsi r8 r12 r15 edx r13d ymm17 ymm19 zmm16 zmm18
..B7.55: # Preds ..B7.54
# Execution count [3.60e-01]: Infreq
xorl %r13d, %r13d #148.13
jmp ..B7.58 # Prob 100% #148.13
# LOE rax rcx rsi r8 r12 r15 edx r13d ymm17 ymm19 zmm16 zmm18
..B7.56: # Preds ..B7.54
# Execution count [3.60e-01]: Infreq
testl %r13d, %r13d #148.13
je ..B7.58 # Prob 50% #148.13
# LOE rax rcx rsi r8 r12 r15 edx r13d ymm17 ymm19 zmm16 zmm18
..B7.57: # Preds ..B7.56
# Execution count [4.00e+00]: Infreq
negl %r13d #148.13
addl $64, %r13d #148.13
shrl $3, %r13d #148.13
cmpl %r13d, %edx #148.13
cmovl %edx, %r13d #148.13
# LOE rax rcx rsi r8 r12 r15 edx r13d ymm17 ymm19 zmm16 zmm18
..B7.58: # Preds ..B7.55 ..B7.57 ..B7.56
# Execution count [8.00e-01]: Infreq
# edi = end column of the unmasked loop = width - ((width - peel) & 7)
movl %edx, %edi #148.13
subl %r13d, %edi #148.13
andl $7, %edi #148.13
negl %edi #148.13
addl %edx, %edi #148.13
cmpl $1, %r13d #148.13
jb ..B7.63 # Prob 50% #148.13
# LOE rax rcx rsi r8 r12 r15 edx edi r13d ymm17 ymm19 zmm16 zmm18
..B7.60: # Preds ..B7.58
# Execution count [7.20e-01]: Infreq
# Peel loop set-up: rbx = column counter, r14 = peel count,
# ymm21 = lane column indices, ymm20 = peel count in all lanes.
vmovdqa32 %ymm17, %ymm21 #148.13
xorl %ebx, %ebx #148.13
vpbroadcastd %r13d, %ymm20 #148.13
movslq %r13d, %r14 #148.13
movq %rcx, 16(%rsp) #148.13[spill]
movq %r8, 32(%rsp) #148.13[spill]
movq %rax, 8(%rsp) #148.13[spill]
movl %edx, 56(%rsp) #148.13[spill]
# LOE rbx rsi r12 r14 r15 edi r13d ymm17 ymm19 ymm20 ymm21 zmm16 zmm18
..B7.61: # Preds ..B7.88 ..B7.60
# Execution count [4.00e+00]: Infreq
vpcmpgtd %ymm21, %ymm20, %k4 #148.13
vmovaps %zmm18, %zmm0 #149.29
kmovw %k4, %k1 #149.29
vcvtdq2pd %ymm21, %zmm2 #149.44
vmulpd %zmm2, %zmm16, %zmm1 #149.48
..___tag_value_initSolver.721:
call *__svml_sin8_mask_z0@GOTPCREL(%rip) #149.29
..___tag_value_initSolver.722:
# LOE rbx rsi r12 r14 r15 edi r13d ymm17 ymm19 ymm20 ymm21 zmm0 zmm16 zmm18 k4
..B7.88: # Preds ..B7.61
# Execution count [4.00e+00]: Infreq
vpaddd %ymm19, %ymm21, %ymm21 #148.13
vmovupd %zmm0, (%r12,%rbx,8){%k4} #149.17
addq $8, %rbx #148.13
cmpq %r14, %rbx #148.13
jb ..B7.61 # Prob 82% #148.13
# LOE rbx rsi r12 r14 r15 edi r13d ymm17 ymm19 ymm20 ymm21 zmm16 zmm18
..B7.62: # Preds ..B7.88
# Execution count [7.20e-01]: Infreq
# Row fully covered by the peel loop -> row advance at ..B7.74
movl 56(%rsp), %edx #[spill]
movq 16(%rsp), %rcx #[spill]
movq 32(%rsp), %r8 #[spill]
movq 8(%rsp), %rax #[spill]
cmpl %r13d, %edx #148.13
je ..B7.74 # Prob 10% #148.13
# LOE rax rcx rsi r8 r12 r15 edx edi r13d ymm17 ymm19 zmm16 zmm18
..B7.63: # Preds ..B7.58 ..B7.62
# Execution count [6.48e-01]: Infreq
# Back to the main register assignment (rsi = row index, r13 = 24(solver),
# r14 = array base, ebx = row width); eax = first column of the main loop.
movq %rsi, 24(%rsp) #[spill]
movq %rax, %rsi #
movq %r8, 32(%rsp) #[spill]
movl %r13d, %eax #
movq 48(%rsp), %r14 #[spill]
movq %rcx, %r13 #
movl %edx, %ebx #
# LOE rsi r12 r13 r14 r15 eax ebx edi ymm17 ymm19 zmm16 zmm18
..B7.64: # Preds ..B7.63 ..B7.72
# Execution count [4.00e+00]: Infreq
vpbroadcastd %eax, %ymm1 #149.29
lea 8(%rax), %r8d #148.13
vpaddd .L_2il0floatpacket.20(%rip), %ymm1, %ymm20 #149.29
cmpl %r8d, %edi #148.13
jl ..B7.68 # Prob 50% #148.13
# LOE rsi r12 r13 r14 r15 eax ebx edi ymm17 ymm19 ymm20 zmm16 zmm18
..B7.65: # Preds ..B7.64
# Execution count [7.20e-01]: Infreq
movslq %eax, %rdx #148.13
movq %r14, 48(%rsp) #148.13[spill]
movl %eax, %r14d #148.13
movl %ebx, 56(%rsp) #148.13[spill]
movq %rdx, %rbx #148.13
# LOE rbx rsi r12 r13 r15 edi r14d ymm17 ymm19 ymm20 zmm16 zmm18
..B7.66: # Preds ..B7.89 ..B7.65
# Execution count [4.00e+00]: Infreq
# Unmasked loop body: 8 columns per iteration
vcvtdq2pd %ymm20, %zmm1 #149.44
vmulpd %zmm1, %zmm16, %zmm0 #149.48
..___tag_value_initSolver.732:
call *__svml_sin8_z0@GOTPCREL(%rip) #149.29
..___tag_value_initSolver.733:
# LOE rbx rsi r12 r13 r15 edi r14d ymm17 ymm19 ymm20 zmm0 zmm16 zmm18
..B7.89: # Preds ..B7.66
# Execution count [4.00e+00]: Infreq
addl $8, %r14d #148.13
vpaddd %ymm19, %ymm20, %ymm20 #149.29
vmovupd %zmm0, (%r12,%rbx,8) #149.17
addq $8, %rbx #148.13
cmpl %edi, %r14d #148.13
jb ..B7.66 # Prob 82% #148.13
# LOE rbx rsi r12 r13 r15 edi r14d ymm17 ymm19 ymm20 zmm16 zmm18
..B7.67: # Preds ..B7.89
# Execution count [7.20e-01]: Infreq
movq 48(%rsp), %r14 #[spill]
movl 56(%rsp), %ebx #[spill]
# LOE rsi r12 r13 r14 r15 ebx edi ymm17 ymm19 zmm16 zmm18
..B7.68: # Preds ..B7.67 ..B7.64 ..B7.73
# Execution count [8.00e-01]: Infreq
# Remainder: columns edi .. width-1 (none when edi + 1 > width)
lea 1(%rdi), %r8d #148.13
cmpl %ebx, %r8d #148.13
ja ..B7.70 # Prob 50% #148.13
# LOE rsi r12 r13 r14 r15 ebx edi ymm17 ymm19 zmm16 zmm18
..B7.69: # Preds ..B7.68
# Execution count [4.00e+00]: Infreq
vpbroadcastd %edi, %ymm2 #149.29
movl %ebx, %r8d #148.13
vpaddd .L_2il0floatpacket.20(%rip), %ymm2, %ymm3 #149.29
subl %edi, %r8d #148.13
vpbroadcastd %r8d, %ymm5 #148.13
vpcmpgtd %ymm17, %ymm5, %k4 #148.13
vmovaps %zmm18, %zmm0 #149.29
kmovw %k4, %k1 #149.29
vcvtdq2pd %ymm3, %zmm4 #149.44
vmulpd %zmm4, %zmm16, %zmm1 #149.48
..___tag_value_initSolver.736:
call *__svml_sin8_mask_z0@GOTPCREL(%rip) #149.29
..___tag_value_initSolver.737:
# LOE rsi r12 r13 r14 r15 ebx edi ymm17 ymm19 zmm0 zmm16 zmm18 k4
..B7.90: # Preds ..B7.69
# Execution count [4.00e+00]: Infreq
# Masked store at array base (r14) + (row element offset r15 + edi) * 8
movslq %edi, %rdi #149.17
addq %r15, %rdi #149.17
vmovupd %zmm0, (%r14,%rdi,8){%k4} #149.17
# LOE rsi r12 r13 r14 r15 ebx ymm17 ymm19 zmm16 zmm18
..B7.70: # Preds ..B7.68 ..B7.50 ..B7.90
# Execution count [7.28e-01]: Infreq
# Row advance (main register assignment)
incq %rsi #147.9
lea 2(%r15,%r13), %r15 #147.9
addq 24(%rsp), %r12 #147.9[spill]
cmpq 32(%rsp), %rsi #147.9[spill]
jb ..B7.50 # Prob 82% #147.9
jmp ..B7.45 # Prob 100% #147.9
# LOE rsi r12 r13 r14 r15 ebx ymm17 ymm19 zmm16 zmm18
..B7.72: # Preds ..B7.53
# Execution count [7.20e-02]: Infreq
# No peel: main loop runs from column 0 to the rounded-down width in (%rsp)
movq %rsi, 24(%rsp) #[spill]
movq %rax, %rsi #
movq %r8, 32(%rsp) #[spill]
movl %edx, %ebx #
movq 48(%rsp), %r14 #[spill]
movq %rcx, %r13 #
movl (%rsp), %edi #148.13[spill]
xorl %eax, %eax #148.13
jmp ..B7.64 # Prob 100% #148.13
# LOE rsi r12 r13 r14 r15 eax ebx edi ymm17 ymm19 zmm16 zmm18
..B7.73: # Preds ..B7.51
# Execution count [7.20e-02]: Infreq
# Row narrower than 8: the masked remainder covers it from column 0
xorl %edi, %edi #148.13
jmp ..B7.68 # Prob 100% #148.13
# LOE rsi r12 r13 r14 r15 ebx edi ymm17 ymm19 zmm16 zmm18
..B7.74: # Preds ..B7.62
# Execution count [7.20e-02]: Infreq
# Row advance (peel-path register assignment)
incq %rax #147.9
addq %rsi, %r12 #147.9
lea 2(%r15,%rcx), %r15 #147.9
cmpq %r8, %rax #147.9
jb ..B7.53 # Prob 82% #147.9
jmp ..B7.45 # Prob 100% #147.9
# LOE rax rcx rsi r8 r12 r15 edx ymm17 ymm19 zmm16 zmm18
..B7.76: # Preds ..B7.10
# Execution count [4.50e-01]: Infreq
# First loop nest, no peel: main loop from column 0 to the rounded-down width
movl (%rsp), %r14d #141.9[spill]
xorl %r15d, %r15d #141.9
jmp ..B7.19 # Prob 100% #141.9
# LOE r12 r13 ebx r14d r15d
..B7.77: # Preds ..B7.9
# Execution count [4.50e-01]: Infreq
# First loop nest, row narrower than 8: masked remainder from column 0
xorl %r14d, %r14d #141.9
jmp ..B7.23 # Prob 100% #141.9
.align 16,0x90
# LOE r12 r13 ebx r14d
.cfi_endproc
# mark_end;
.type initSolver,@function
.size initSolver,.-initSolver
..LNinitSolver.6:
.data
# -- End initSolver
.section .rodata, "a"
.align 64
.align 64
.L_2il0floatpacket.0:
.long 0x00000010,0x00000010,0x00000010,0x00000010,0x00000010,0x00000010,0x00000010,0x00000010,0x00000010,0x00000010,0x00000010,0x00000010,0x00000010,0x00000010,0x00000010,0x00000010
.type .L_2il0floatpacket.0,@object
.size .L_2il0floatpacket.0,64
.align 64
.L_2il0floatpacket.1:
.long 0x00000001,0x00000001,0x00000001,0x00000001,0x00000001,0x00000001,0x00000001,0x00000001,0x00000001,0x00000001,0x00000001,0x00000001,0x00000001,0x00000001,0x00000001,0x00000001
.type .L_2il0floatpacket.1,@object
.size .L_2il0floatpacket.1,64
.align 64
.L_2il0floatpacket.2:
.long 0x00000000,0x00000001,0x00000002,0x00000003,0x00000004,0x00000005,0x00000006,0x00000007,0x00000008,0x00000009,0x0000000a,0x0000000b,0x0000000c,0x0000000d,0x0000000e,0x0000000f
.type .L_2il0floatpacket.2,@object
.size .L_2il0floatpacket.2,64
.align 64
.L_2il0floatpacket.3:
.long 0x00000001,0x00000002,0x00000003,0x00000004,0x00000005,0x00000006,0x00000007,0x00000008,0x00000009,0x0000000a,0x0000000b,0x0000000c,0x0000000d,0x0000000e,0x0000000f,0x00000010
.type .L_2il0floatpacket.3,@object
.size .L_2il0floatpacket.3,64
.align 64
.L_2il0floatpacket.4:
.long 0x00000000,0x00000001,0x00000002,0x00000003,0x00000004,0x00000005,0x00000006,0x00000007,0x00000008,0x00000009,0x0000000a,0x0000000b,0x0000000c,0x0000000d,0x0000000e,0x0000000f
.type .L_2il0floatpacket.4,@object
.size .L_2il0floatpacket.4,64
.align 64
.L_2il0floatpacket.11:
.long 0x00000000,0x00000000,0x00000002,0x00000000,0x00000004,0x00000000,0x00000006,0x00000000,0x00000008,0x00000000,0x0000000a,0x00000000,0x0000000c,0x00000000,0x0000000e,0x00000000
.type .L_2il0floatpacket.11,@object
.size .L_2il0floatpacket.11,64
.align 64
.L_2il0floatpacket.12:
.long 0x00000001,0x00000000,0x00000003,0x00000000,0x00000005,0x00000000,0x00000007,0x00000000,0x00000009,0x00000000,0x0000000b,0x00000000,0x0000000d,0x00000000,0x0000000f,0x00000000
.type .L_2il0floatpacket.12,@object
.size .L_2il0floatpacket.12,64
.align 64
.L_2il0floatpacket.13:
.long 0x00000000,0x40000000,0x00000000,0x40000000,0x00000000,0x40000000,0x00000000,0x40000000,0x00000000,0x40000000,0x00000000,0x40000000,0x00000000,0x40000000,0x00000000,0x40000000
.type .L_2il0floatpacket.13,@object
.size .L_2il0floatpacket.13,64
.align 64
.L_2il0floatpacket.14:
.long 0x00000000,0x00000000,0x00000002,0x00000000,0x00000004,0x00000000,0x00000006,0x00000000,0x00000008,0x00000000,0x0000000a,0x00000000,0x0000000c,0x00000000,0x0000000e,0x00000000
.type .L_2il0floatpacket.14,@object
.size .L_2il0floatpacket.14,64
.align 64
.L_2il0floatpacket.15:
.long 0x00000000,0x00000000,0x00000000,0x00000000,0x00000001,0x00000000,0x00000000,0x00000000,0x00000002,0x00000000,0x00000000,0x00000000,0x00000003,0x00000000,0x00000000,0x00000000
.type .L_2il0floatpacket.15,@object
.size .L_2il0floatpacket.15,64
.align 64
.L_2il0floatpacket.16:
.long 0x00000004,0x00000000,0x00000000,0x00000000,0x00000005,0x00000000,0x00000000,0x00000000,0x00000006,0x00000000,0x00000000,0x00000000,0x00000007,0x00000000,0x00000000,0x00000000
.type .L_2il0floatpacket.16,@object
.size .L_2il0floatpacket.16,64
# .L_2il0floatpacket.17 -- 64-byte constant, 64-byte aligned.
# The first 16 bytes, split into little-endian 16-bit words, are
# 0x0001, 0x0002, 0x0004, 0x0008, 0x0010, 0x0020, 0x0040, 0x0080
# (one set bit each, bit 0 through bit 7). The remaining 48 bytes are zero.
# NOTE(review): presumably a per-lane bit-mask table; the consumer is not
# visible in this chunk -- confirm at the use site.
.align 64
.L_2il0floatpacket.17:
.long 0x00020001,0x00080004,0x00200010,0x00800040,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000,0x00000000
.type .L_2il0floatpacket.17,@object
.size .L_2il0floatpacket.17,64
# .L_2il0floatpacket.6 -- 32-byte constant, 32-byte aligned.
# Eight 32-bit values, every one equal to 8.
# NOTE(review): presumably a per-lane increment for an 8-lane index vector;
# the consumer is not visible in this chunk.
.align 32
.L_2il0floatpacket.6:
.long 0x00000008,0x00000008,0x00000008,0x00000008,0x00000008,0x00000008,0x00000008,0x00000008
.type .L_2il0floatpacket.6,@object
.size .L_2il0floatpacket.6,32
# .L_2il0floatpacket.7 -- 32-byte constant, 32-byte aligned.
# Eight 32-bit values 0, 1, 2, ..., 7 in ascending order.
# The byte content is identical to .L_2il0floatpacket.20 below.
.align 32
.L_2il0floatpacket.7:
.long 0x00000000,0x00000001,0x00000002,0x00000003,0x00000004,0x00000005,0x00000006,0x00000007
.type .L_2il0floatpacket.7,@object
.size .L_2il0floatpacket.7,32
# .L_2il0floatpacket.20 -- 32-byte constant, 32-byte aligned.
# Eight 32-bit values 0, 1, 2, ..., 7 in ascending order.
# Byte-for-byte duplicate of .L_2il0floatpacket.7; it is a separate label,
# so the two are referenced independently.
.align 32
.L_2il0floatpacket.20:
.long 0x00000000,0x00000001,0x00000002,0x00000003,0x00000004,0x00000005,0x00000006,0x00000007
.type .L_2il0floatpacket.20,@object
.size .L_2il0floatpacket.20,32
# .L_2il0floatpacket.5 -- 8-byte scalar constant, 8-byte aligned.
# Low dword first (little-endian): 0x3fe0000000000000, the IEEE-754 binary64
# encoding of 0.5.
.align 8
.L_2il0floatpacket.5:
.long 0x00000000,0x3fe00000
.type .L_2il0floatpacket.5,@object
.size .L_2il0floatpacket.5,8
# .L_2il0floatpacket.8 -- 8-byte scalar constant, 8-byte aligned.
# Low dword first (little-endian): 0x4000000000000000, the IEEE-754 binary64
# encoding of 2.0.
.align 8
.L_2il0floatpacket.8:
.long 0x00000000,0x40000000
.type .L_2il0floatpacket.8,@object
.size .L_2il0floatpacket.8,8
# .L_2il0floatpacket.9 -- 8-byte scalar constant, 8-byte aligned.
# Low dword first (little-endian): 0x3ff0000000000000, the IEEE-754 binary64
# encoding of 1.0.
.align 8
.L_2il0floatpacket.9:
.long 0x00000000,0x3ff00000
.type .L_2il0floatpacket.9,@object
.size .L_2il0floatpacket.9,8
# .L_2il0floatpacket.10 -- 8-byte scalar constant, 8-byte aligned.
# Low dword first (little-endian): 0x3fd0000000000000, the IEEE-754 binary64
# encoding of 0.25.
.align 8
.L_2il0floatpacket.10:
.long 0x00000000,0x3fd00000
.type .L_2il0floatpacket.10,@object
.size .L_2il0floatpacket.10,8
# .L_2il0floatpacket.18 -- 8-byte scalar constant, 8-byte aligned.
# Low dword first (little-endian): 0x402921fb54442d18, the IEEE-754 binary64
# value closest to 4*pi (approximately 12.566370614359172). It has the same
# mantissa as .L_2il0floatpacket.19 with the exponent one higher.
.align 8
.L_2il0floatpacket.18:
.long 0x54442d18,0x402921fb
.type .L_2il0floatpacket.18,@object
.size .L_2il0floatpacket.18,8
# .L_2il0floatpacket.19 -- 8-byte scalar constant, 8-byte aligned.
# Low dword first (little-endian): 0x401921fb54442d18, the IEEE-754 binary64
# value closest to 2*pi (approximately 6.283185307179586).
.align 8
.L_2il0floatpacket.19:
.long 0x54442d18,0x401921fb
.type .L_2il0floatpacket.19,@object
.size .L_2il0floatpacket.19,8
# Start of the 4-byte-aligned string-literal section. Flags "aMS" with entry
# size 1 mark it as allocatable, mergeable, NUL-terminated byte strings.
# The compiler emits each literal as packed little-endian integers rather
# than as .ascii/.asciz text.
.section .rodata.str1.4, "aMS",@progbits,1
.space 1, 0x00 # pad
.align 4
# .L_2__STRING.4 -- decodes to the 6-byte C string "p.dat" (NUL included):
# the .long supplies the bytes 'p' '.' 'd' 'a', the .word supplies 't' and
# the terminating NUL.
.L_2__STRING.4:
.long 1633955440
.word 116
.type .L_2__STRING.4,@object
.size .L_2__STRING.4,6
# Two zero bytes of padding, then .L_2__STRING.9 on a 4-byte boundary.
# .L_2__STRING.9 decodes to the 2-byte C string "w" (NUL included): the
# .word holds 'w' (119) in its low byte and the terminating NUL in its high
# byte.
# NOTE(review): presumably an fopen mode string; the call site is outside
# this chunk.
.space 2, 0x00 # pad
.align 4
.L_2__STRING.9:
.word 119
.type .L_2__STRING.9,@object
.size .L_2__STRING.9,2
# Two zero bytes of padding, then .L_2__STRING.11 on a 4-byte boundary.
# .L_2__STRING.11 decodes to the 4-byte C string "%f " (percent, 'f', space,
# NUL): the single .long 0x00206625 carries all four bytes.
.space 2, 0x00 # pad
.align 4
.L_2__STRING.11:
.long 2123301
.type .L_2__STRING.11,@object
.size .L_2__STRING.11,4
# .L_2__STRING.1 -- decodes to the 7-byte C string "%02d: " (NUL included):
# the .long supplies '%' '0' '2' 'd', the .word supplies ':' and a space,
# and the .byte is the terminating NUL.
.align 4
.L_2__STRING.1:
.long 1681010725
.word 8250
.byte 0
.type .L_2__STRING.1,@object
.size .L_2__STRING.1,7
# One zero byte of padding, then .L_2__STRING.2 on a 4-byte boundary.
# .L_2__STRING.2 decodes to the 9-byte C string "%12.8f  " (format
# specifier followed by TWO spaces, then NUL): the first .long supplies
# '%' '1' '2' '.', the second supplies '8' 'f' ' ' ' '.
.space 1, 0x00 # pad
.align 4
.L_2__STRING.2:
.long 775041317
.long 538994232
.byte 0
.type .L_2__STRING.2,@object
.size .L_2__STRING.2,9
# Three zero bytes of padding, then .L_2__STRING.6 on a 4-byte boundary.
# .L_2__STRING.6 decodes to the 27-byte C string
#   "Solver took %d iterations\n"
# (26 characters plus NUL). Each .long packs four consecutive characters in
# little-endian order; the per-line notes give the decoded text.
.space 3, 0x00 # pad
.align 4
.L_2__STRING.6:
# "Solv"
.long 1986817875
# "er t"
.long 1948283493
# "ook "
.long 543911791
# "%d i"
.long 1763730469
# "tera"
.long 1634887028
# "tion"
.long 1852795252
# "s" followed by newline
.word 2675
# terminating NUL
.byte 0
.type .L_2__STRING.6,@object
.size .L_2__STRING.6,27
# One zero byte of padding, then .L_2__STRING.7 on a 4-byte boundary.
# .L_2__STRING.7 decodes to the 17-byte C string
#   "Final omega: %f\n"
# (16 characters plus NUL). Each .long packs four consecutive characters in
# little-endian order.
.space 1, 0x00 # pad
.align 4
.L_2__STRING.7:
# "Fina"
.long 1634625862
# "l om"
.long 1835999340
# "ega:"
.long 979461989
# " %f" followed by newline
.long 174466336
# terminating NUL
.byte 0
.type .L_2__STRING.7,@object
.size .L_2__STRING.7,17
# Three zero bytes of padding, then .L_2__STRING.8 on a 4-byte boundary.
# .L_2__STRING.8 decodes to the 39-byte C string
#   "Solver took %d iterations to reach %f\n"
# (38 characters plus NUL). Its first 24 bytes match the start of
# .L_2__STRING.6. Each .long packs four consecutive characters in
# little-endian order.
.space 3, 0x00 # pad
.align 4
.L_2__STRING.8:
# "Solv"
.long 1986817875
# "er t"
.long 1948283493
# "ook "
.long 543911791
# "%d i"
.long 1763730469
# "tera"
.long 1634887028
# "tion"
.long 1852795252
# "s to"
.long 1869881459
# " rea"
.long 1634038304
# "ch %"
.long 622880867
# "f" followed by newline
.word 2662
# terminating NUL
.byte 0
.type .L_2__STRING.8,@object
.size .L_2__STRING.8,39
# One zero byte of padding, then .L_2__STRING.5 on a 4-byte boundary.
# .L_2__STRING.5 decodes to the 41-byte C string
#   "RANK %d: imaxLocal : %d, jmaxLocal : %d\n"
# (40 characters plus NUL). Each .long packs four consecutive characters in
# little-endian order.
.space 1, 0x00 # pad
.align 4
.L_2__STRING.5:
# "RANK"
.long 1263419730
# " %d:"
.long 979641632
# " ima"
.long 1634560288
# "xLoc"
.long 1668238456
# "al :"
.long 975203425
# " %d,"
.long 744760608
# " jma"
.long 1634560544
# "xLoc"
.long 1668238456
# "al :"
.long 975203425
# " %d" followed by newline
.long 174335264
# terminating NUL
.byte 0
.type .L_2__STRING.5,@object
.size .L_2__STRING.5,41
# Start of the 32-byte-aligned string-literal section (same "aMS" flags and
# entry size 1 as .rodata.str1.4). The .align 32 directive appears twice in
# the compiler output; the second one has no additional effect.
.section .rodata.str1.32, "aMS",@progbits,1
.align 32
.align 32
# .L_2__STRING.0 -- decodes to the 69-byte C string
#   "### RANK %d " + 55 '#' characters + "\n"
# (68 characters plus NUL). Each .long packs four consecutive characters in
# little-endian order; 589505315 is 0x23232323, i.e. "####".
.L_2__STRING.0:
# "### "
.long 539173667
# "RANK"
.long 1263419730
# " %d "
.long 543434016
# thirteen repetitions of "####" (52 '#' characters)
.long 589505315
.long 589505315
.long 589505315
.long 589505315
.long 589505315
.long 589505315
.long 589505315
.long 589505315
.long 589505315
.long 589505315
.long 589505315
.long 589505315
.long 589505315
# "###" followed by newline
.long 170074915
# terminating NUL
.byte 0
.type .L_2__STRING.0,@object
.size .L_2__STRING.0,69
# File trailer. The .data directive switches to the data section, but nothing
# is emitted into it here because the next line switches sections again.
.data
# Empty .note.GNU-stack section with no flags. By GNU toolchain convention
# this marks the object as not requiring an executable stack.
.section .note.GNU-stack, ""
# End