# NuSiF-Solver/PoissonSolver/2D-mpi/ICC/main.s
#
# 322 lines
# 15 KiB
# x86-64 assembly, AT&T (GAS) syntax -- listed as "ArmAsm" by the hosting page

# mark_description "Intel(R) C Intel(R) 64 Compiler Classic for applications running on Intel(R) 64, Version 2021.10.0 Build 202";
# mark_description "30609_000000";
# mark_description "-I./src/includes -I./ICC -I/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-mpi-2021.1";
# mark_description "0.0-ki6gcj4pr5rekayazvm4lsmvcyosce25/mpi/2021.10.0/include -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux";
# mark_description "8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux";
# mark_description "/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-ax";
# mark_description "ze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/x64 -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almal";
# mark_description "inux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/l";
# mark_description "inux/lib/oclfpga/host/linux64/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel";
# mark_description "-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/oclfpga/linux64/lib ";
# mark_description "-Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7oc";
# mark_description "bc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/compiler/lib/intel64_lin -gcc-name=/usr/bin/gcc -gxx-name=";
# mark_description "/usr/bin/g++ -S -fverbose-asm -D_GNU_SOURCE -DARRAY_ALIGNMENT=64 -O3 -xHost -qopt-zmm-usage=high -std=c99 -o";
# mark_description " ICC/main.s";
.file "main.c"
.text
..TXTST0:
.L_2__routine_start_main_0:
# -- Begin main
#-----------------------------------------------------------------------
# int main(int argc, char **argv)
# ABI:    System V AMD64, AT&T syntax (compiler-generated listing).
# In:     %edi = argc, %rsi = argv
# Out:    %eax = 0 on the normal path; the usage path calls exit(0).
# Saved:  %rbp (frame pointer) and %r12 are pushed on entry and popped
#         before ret.
# Frame:  %rsp is realigned to 128 bytes; after the %r12 push and the
#         248-byte allocation the locals are:
#           0(%rsp)    Solver object (also MXCSR scratch before initSolver)
#           96(%rsp)   Parameter object
#           160(%rsp)  start timestamp (double), spilled across the solve
#           168(%rsp)  argv
#           176(%rsp)  rank written by MPI_Comm_rank
#           184(%rsp)  argc
# Regs:   %r12d = solver variant selector, default 2; replaced by the
#         parsed value of argv[2] when argc == 3.
#           1 -> prints "Plain SOR", calls solve
#           2 -> prints "Red-black SOR", calls solveRB
#           3 -> prints "Red-black SOR with acceleration", calls solveRBA
#           any other value -> no solver is called
#-----------------------------------------------------------------------
        .text
# mark_begin;
        .align 16,0x90
        .globl main
# --- main(int, char **)
main:
# parameter 1: %edi
# parameter 2: %rsi
..B1.1: # Preds ..B1.0
# Execution count [1.00e+00]
# Prologue: set up the frame, stash argc/argv, then run the Intel
# CPU-feature initialisation routine.
        .cfi_startproc
..___tag_value_main.1:
..L2:
#21.1
        pushq %rbp #21.1
        .cfi_def_cfa_offset 16
        movq %rsp, %rbp #21.1
        .cfi_def_cfa 6, 16
        .cfi_offset 6, -16
        andq $-128, %rsp #21.1
        pushq %r12 #21.1
        subq $248, %rsp #21.1
        movl %edi, 184(%rsp) #21.1
        movl $3, %edi #21.1
        movq %rsi, 168(%rsp) #21.1
        movq $0x64199d9ffe, %rsi #21.1
        call __intel_new_feature_proc_init #21.1
        .cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0x80, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
# LOE rbx r13 r14 r15
..B1.31: # Preds ..B1.1
# Execution count [1.00e+00]
# OR 0x8040 into MXCSR (bit 15 = flush-to-zero, bit 6 = denormals-are-zero),
# interleaved with setting the default variant and the MPI_Init arguments
# (&argc, &argv).
        vstmxcsr (%rsp) #21.1
        movl $2, %r12d #23.17
        lea 184(%rsp), %rdi #30.5
        orl $32832, (%rsp) #21.1
        lea 168(%rsp), %rsi #30.5
        vldmxcsr (%rsp) #21.1
..___tag_value_main.7:
# MPI_Init(int *, char ***)
        call MPI_Init #30.5
..___tag_value_main.8:
# LOE rbx r13 r14 r15 r12d
..B1.2: # Preds ..B1.31
# Execution count [1.00e+00]
# MPI_Comm_rank(0x44000000, &rank); the communicator handle is presumably
# MPI_COMM_WORLD in this MPI implementation -- confirm against its mpi.h.
        movl $1140850688, %edi #31.5
        lea 176(%rsp), %rsi #31.5
..___tag_value_main.9:
# MPI_Comm_rank(MPI_Comm, int *)
        call MPI_Comm_rank #31.5
..___tag_value_main.10:
# LOE rbx r13 r14 r15 r12d
..B1.3: # Preds ..B1.2
# Execution count [1.00e+00]
        lea 96(%rsp), %rdi #32.5
..___tag_value_main.11:
# initParameter(Parameter *)
        call initParameter #32.5
..___tag_value_main.12:
# LOE rbx r13 r14 r15 r12d
..B1.4: # Preds ..B1.3
# Execution count [1.00e+00]
# argc >= 2 continues at ..B1.7; otherwise fall through to the usage message.
        cmpl $2, 184(%rsp) #34.16
        jge ..B1.7 # Prob 50% #34.16
# LOE rbx r13 r14 r15 r12d
..B1.5: # Preds ..B1.4
# Execution count [5.00e-01]
# printf("Usage: %s <configFile>\n", argv[0]); %eax = 0 because no vector
# registers carry arguments to this variadic call.
        movq 168(%rsp), %rax #35.9
        movl $.L_2__STRING.0, %edi #35.9
        movq (%rax), %rsi #35.9
        xorl %eax, %eax #35.9
..___tag_value_main.13:
# printf(const char *__restrict__, ...)
        call printf #35.9
..___tag_value_main.14:
# LOE
..B1.6: # Preds ..B1.5
# Execution count [5.00e-01]
        xorl %edi, %edi #36.9
# exit(int)
        call exit #36.9
# LOE
..B1.7: # Preds ..B1.4
# Execution count [5.00e-01]
# readParameter(&params, argv[1])
        movq 168(%rsp), %rax #39.5
        lea 96(%rsp), %rdi #39.5
        movq 8(%rax), %rsi #39.5
..___tag_value_main.15:
# readParameter(Parameter *, const char *)
        call readParameter #39.5
..___tag_value_main.16:
# LOE rbx r13 r14 r15 r12d
..B1.8: # Preds ..B1.7
# Execution count [5.00e-01]
# argc == 3: take the out-of-line path that parses argv[2] into %r12d.
        cmpl $3, 184(%rsp) #40.17
        je ..B1.27 # Prob 16% #40.17
# LOE rbx r13 r14 r15 r12d
..B1.9: # Preds ..B1.28 ..B1.8
# Execution count [5.00e-01]
# Only rank 0 prints the parameters.
        cmpl $0, 176(%rsp) #44.17
        jne ..B1.11 # Prob 78% #44.17
# LOE rbx r13 r14 r15 r12d
..B1.10: # Preds ..B1.9
# Execution count [1.10e-01]
        lea 96(%rsp), %rdi #45.9
..___tag_value_main.17:
# printParameter(Parameter *)
        call printParameter #45.9
..___tag_value_main.18:
# LOE rbx r13 r14 r15 r12d
..B1.11: # Preds ..B1.10 ..B1.9
# Execution count [5.00e-01]
# initSolver(&solver, &params, 2)
        movl $2, %edx #48.5
        lea (%rsp), %rdi #48.5
        lea 96(%rsp), %rsi #48.5
..___tag_value_main.19:
# initSolver(Solver *, Parameter *, int)
        call initSolver #48.5
..___tag_value_main.20:
# LOE rbx r13 r14 r15 r12d
..B1.12: # Preds ..B1.11
# Execution count [5.00e-01]
# Take the start timestamp (returned in %xmm0).
        xorl %eax, %eax #50.9
..___tag_value_main.21:
# getTimeStamp()
        call getTimeStamp #50.9
..___tag_value_main.22:
# LOE rbx r13 r14 r15 r12d xmm0
..B1.32: # Preds ..B1.12
# Execution count [5.00e-01]
# %xmm0 is caller-saved, so keep the start time on the stack across the solve.
        vmovsd %xmm0, 160(%rsp) #50.9[spill]
# LOE rbx r13 r14 r15 r12d
..B1.13: # Preds ..B1.32
# Execution count [5.00e-01]
# Dispatch on the variant selector in %r12d (1, 2, 3; anything else skips).
        cmpl $1, %r12d #52.13
        je ..B1.20 # Prob 25% #52.13
# LOE rbx r13 r14 r15 r12d
..B1.14: # Preds ..B1.13
# Execution count [3.75e-01]
        cmpl $2, %r12d #52.13
        jne ..B1.17 # Prob 66% #52.13
# LOE rbx r13 r14 r15 r12d
..B1.15: # Preds ..B1.14
# Execution count [1.25e-01]
# Variant 2: puts("Red-black SOR"), then solveRB(&solver).
        movl $il0_peep_printf_format_1, %edi #58.9
        call puts #58.9
# LOE rbx r13 r14 r15
..B1.16: # Preds ..B1.15
# Execution count [1.25e-01]
        lea (%rsp), %rdi #59.9
..___tag_value_main.24:
# solveRB(Solver *)
        call solveRB #59.9
..___tag_value_main.25:
        jmp ..B1.22 # Prob 100% #59.9
# LOE rbx r13 r14 r15
..B1.17: # Preds ..B1.14
# Execution count [2.50e-01]
        cmpl $3, %r12d #52.13
        jne ..B1.22 # Prob 50% #52.13
# LOE rbx r13 r14 r15
..B1.18: # Preds ..B1.17
# Execution count [1.25e-01]
# Variant 3: puts("Red-black SOR with acceleration"), then solveRBA(&solver).
        movl $il0_peep_printf_format_0, %edi #62.9
        call puts #62.9
# LOE rbx r13 r14 r15
..B1.19: # Preds ..B1.18
# Execution count [1.25e-01]
        lea (%rsp), %rdi #63.9
..___tag_value_main.26:
# solveRBA(Solver *)
        call solveRBA #63.9
..___tag_value_main.27:
        jmp ..B1.22 # Prob 100% #63.9
# LOE rbx r13 r14 r15
..B1.20: # Preds ..B1.13
# Execution count [1.25e-01]
# Variant 1: puts("Plain SOR"), then solve(&solver).
        movl $il0_peep_printf_format_2, %edi #54.9
        call puts #54.9
# LOE rbx r13 r14 r15
..B1.21: # Preds ..B1.20
# Execution count [1.25e-01]
        lea (%rsp), %rdi #55.9
..___tag_value_main.28:
# solve(Solver *)
        call solve #55.9
..___tag_value_main.29:
# LOE rbx r13 r14 r15
..B1.22: # Preds ..B1.21 ..B1.16 ..B1.19 ..B1.17
# Execution count [5.00e-01]
# Take the end timestamp (returned in %xmm0).
        xorl %eax, %eax #68.9
..___tag_value_main.30:
# getTimeStamp()
        call getTimeStamp #68.9
..___tag_value_main.31:
# LOE rbx r13 r14 r15 xmm0
..B1.23: # Preds ..B1.22
# Execution count [5.00e-01]
# Only rank 0 reports the elapsed time.
        cmpl $0, 176(%rsp) #70.17
        jne ..B1.25 # Prob 78% #70.17
# LOE rbx r13 r14 r15 xmm0
..B1.24: # Preds ..B1.23
# Execution count [1.10e-01]
# printf("Solution took %.2fs\n", end - start); %eax = 1 because one vector
# register (%xmm0) carries an argument to this variadic call.
        movl $.L_2__STRING.4, %edi #71.9
        movl $1, %eax #71.9
        vsubsd 160(%rsp), %xmm0, %xmm0 #71.9[spill]
..___tag_value_main.32:
# printf(const char *__restrict__, ...)
        call printf #71.9
..___tag_value_main.33:
# LOE rbx r13 r14 r15
..B1.25: # Preds ..B1.24 ..B1.23
# Execution count [5.00e-01]
..___tag_value_main.35:
# MPI_Finalize(void)
        call MPI_Finalize #74.5
..___tag_value_main.36:
# LOE rbx r13 r14 r15
..B1.26: # Preds ..B1.25
# Execution count [5.00e-01]
# Epilogue: return 0, undoing the allocation, the %r12 save and the frame.
        xorl %eax, %eax #75.12
        addq $248, %rsp #75.12
        .cfi_restore 12
        popq %r12 #75.12
        movq %rbp, %rsp #75.12
        popq %rbp #75.12
        .cfi_def_cfa 7, 8
        .cfi_restore 6
        ret #75.12
        .cfi_def_cfa 6, 16
        .cfi_offset 6, -16
        .cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0x80, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
# LOE
..B1.27: # Preds ..B1.8
# Execution count [8.00e-02]: Infreq
# argc == 3: convert argv[2] to an integer. The string pointer must be in
# %rdi, the first integer/pointer argument register under System V AMD64;
# %rdi still holds a stale value from the readParameter call otherwise.
        movq 168(%rsp), %rax #41.19
        movq 16(%rax), %rdi #41.19
..___tag_value_main.43:
        call *__intel_sse4_atol@GOTPCREL(%rip) #41.19
..___tag_value_main.44:
# LOE rax rbx r13 r14 r15
..B1.28: # Preds ..B1.27
# Execution count [8.00e-02]: Infreq
# Keep the low 32 bits of the result as the variant selector and rejoin.
        movl %eax, %r12d #41.19
        jmp ..B1.9 # Prob 100% #41.19
        .align 16,0x90
# LOE rbx r13 r14 r15 r12d
        .cfi_endproc
# mark_end;
        .type main,@function
        .size main,.-main
..LNmain.0:
# Read-only, NUL-terminated message strings referenced by main.
# Each .asciz literal emits its characters followed by one 0 byte; the
# explicit .space/.align directives supply the remaining padding.
        .section .rodata.str1.4, "aMS",@progbits,1
        .align 4
# Passed to puts for variant 2.
il0_peep_printf_format_1:
        .asciz "Red-black SOR"
        .space 2, 0x00 # pad
        .align 4
# Passed to puts for variant 3.
il0_peep_printf_format_0:
        .asciz "Red-black SOR with acceleration"
        .align 4
# Passed to puts for variant 1.
il0_peep_printf_format_2:
        .asciz "Plain SOR"
        .data
# -- End main
        .section .rodata.str1.4, "aMS",@progbits,1
        .space 2, 0x00 # pad
        .align 4
# printf format for the usage message (takes argv[0] as %s); 24 bytes with NUL.
.L_2__STRING.0:
        .asciz "Usage: %s <configFile>\n"
        .type .L_2__STRING.0,@object
        .size .L_2__STRING.0,24
        .align 4
# printf format for the elapsed-time report (one double); 21 bytes with NUL.
.L_2__STRING.4:
        .asciz "Solution took %.2fs\n"
        .type .L_2__STRING.4,@object
        .size .L_2__STRING.4,21
        .data
.section .note.GNU-stack, ""
# End