Incomplete 2D-seq multigrid
This commit is contained in:
18
PoissonSolver/2D-mpi/ICC/affinity.s
Normal file
18
PoissonSolver/2D-mpi/ICC/affinity.s
Normal file
@@ -0,0 +1,18 @@
|
||||
# mark_description "Intel(R) C Intel(R) 64 Compiler Classic for applications running on Intel(R) 64, Version 2021.10.0 Build 202";
|
||||
# mark_description "30609_000000";
|
||||
# mark_description "-I./src/includes -I./ICC -I/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-mpi-2021.1";
|
||||
# mark_description "0.0-ki6gcj4pr5rekayazvm4lsmvcyosce25/mpi/2021.10.0/include -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux";
|
||||
# mark_description "8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux";
|
||||
# mark_description "/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-ax";
|
||||
# mark_description "ze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/x64 -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almal";
|
||||
# mark_description "inux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/l";
|
||||
# mark_description "inux/lib/oclfpga/host/linux64/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel";
|
||||
# mark_description "-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/oclfpga/linux64/lib ";
|
||||
# mark_description "-Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7oc";
|
||||
# mark_description "bc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/compiler/lib/intel64_lin -gcc-name=/usr/bin/gcc -gxx-name=";
|
||||
# mark_description "/usr/bin/g++ -S -fverbose-asm -D_GNU_SOURCE -DARRAY_ALIGNMENT=64 -O3 -xHost -qopt-zmm-usage=high -std=c99 -o";
|
||||
# mark_description " ICC/affinity.s";
|
||||
.file "affinity.c"
|
||||
.data
|
||||
.section .note.GNU-stack, ""
|
||||
# End
|
152
PoissonSolver/2D-mpi/ICC/allocate.s
Normal file
152
PoissonSolver/2D-mpi/ICC/allocate.s
Normal file
@@ -0,0 +1,152 @@
|
||||
# mark_description "Intel(R) C Intel(R) 64 Compiler Classic for applications running on Intel(R) 64, Version 2021.10.0 Build 202";
|
||||
# mark_description "30609_000000";
|
||||
# mark_description "-I./src/includes -I./ICC -I/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-mpi-2021.1";
|
||||
# mark_description "0.0-ki6gcj4pr5rekayazvm4lsmvcyosce25/mpi/2021.10.0/include -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux";
|
||||
# mark_description "8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux";
|
||||
# mark_description "/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-ax";
|
||||
# mark_description "ze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/x64 -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almal";
|
||||
# mark_description "inux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/l";
|
||||
# mark_description "inux/lib/oclfpga/host/linux64/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel";
|
||||
# mark_description "-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/oclfpga/linux64/lib ";
|
||||
# mark_description "-Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7oc";
|
||||
# mark_description "bc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/compiler/lib/intel64_lin -gcc-name=/usr/bin/gcc -gxx-name=";
|
||||
# mark_description "/usr/bin/g++ -S -fverbose-asm -D_GNU_SOURCE -DARRAY_ALIGNMENT=64 -O3 -xHost -qopt-zmm-usage=high -std=c99 -o";
|
||||
# mark_description " ICC/allocate.s";
|
||||
.file "allocate.c"
|
||||
.text
|
||||
..TXTST0:
|
||||
.L_2__routine_start_allocate_0:
|
||||
# -- Begin allocate
|
||||
.text
|
||||
# mark_begin;
|
||||
.align 16,0x90
|
||||
.globl allocate
|
||||
# --- allocate(int, size_t)
# Purpose: obtain an aligned buffer through posix_memalign and return it.
# Compiler-generated (Intel C Compiler Classic), x86-64 AT&T syntax, SysV AMD64 ABI.
#   In:   %edi = first argument  (int; forwarded as posix_memalign's 2nd argument)
#         %rsi = second argument (size_t; forwarded as posix_memalign's 3rd argument)
#   Out:  %rax = pointer that posix_memalign stored in the stack slot
#   Stack: one 8-byte slot at (%rsp) created by "pushq %rsi"; it receives the
#          result pointer and also gives 16-byte stack alignment at the calls.
# Every failure branch writes a message to stderr with fputs and then calls
# exit(1); the code has no return path after those calls.
|
||||
allocate:
|
||||
# parameter 1: %edi
|
||||
||||
# parameter 2: %rsi
|
||||
..B1.1: # Preds ..B1.0
|
||||
# Execution count [1.00e+00]
|
||||
.cfi_startproc
|
||||
..___tag_value_allocate.1:
|
||||
..L2:
|
||||
#12.1
|
||||
# The push only reserves the 8-byte result slot; the value pushed is incidental.
pushq %rsi #12.1
|
||||
.cfi_def_cfa_offset 16
|
||||
# Shuffle the incoming arguments into posix_memalign(&slot, (size_t)arg1, arg2).
movq %rsi, %rdx #12.1
|
||||
movslq %edi, %rsi #16.18
|
||||
lea (%rsp), %rdi #16.18
|
||||
# posix_memalign(void **, size_t, size_t)
|
||||
call posix_memalign #16.18
|
||||
# LOE rbx rbp r12 r13 r14 r15 eax
|
||||
..B1.2: # Preds ..B1.1
|
||||
# Execution count [1.00e+00]
|
||||
# Return value 0 means success: go straight to the pointer check.
testl %eax, %eax #18.9
|
||||
je ..B1.5 # Prob 50% #18.9
|
||||
# LOE rbx rbp r12 r13 r14 r15 eax
|
||||
..B1.3: # Preds ..B1.2
|
||||
# Execution count [5.00e-01]
|
||||
# Error code 22 (EINVAL on Linux) selects the "alignment" message in ..B1.9.
cmpl $22, %eax #19.26
|
||||
je ..B1.9 # Prob 0% #19.26
|
||||
# LOE rbx rbp r12 r13 r14 r15 eax
|
||||
..B1.4: # Preds ..B1.3
|
||||
# Execution count [4.95e-01]
|
||||
# Error code 12 (ENOMEM on Linux) selects the "insufficient memory" message in ..B1.7.
cmpl $12, %eax #24.26
|
||||
je ..B1.7 # Prob 0% #24.26
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.5: # Preds ..B1.4 ..B1.2
|
||||
# Execution count [9.90e-01]
|
||||
# Load the result pointer from the slot and reject NULL.
# NOTE(review): this block is also reached for a nonzero return other than 22/12;
# the slot then holds whatever posix_memalign left there (initially the pushed %rsi).
movq (%rsp), %rax #31.9
|
||||
testq %rax, %rax #31.16
|
||||
je ..B1.11 # Prob 1% #31.16
|
||||
# LOE rax rbx rbp r12 r13 r14 r15
|
||||
..B1.6: # Preds ..B1.5
|
||||
# Execution count [9.72e-01]
|
||||
# Success: release the slot (the popped value in %rcx is discarded) and return %rax.
popq %rcx #36.12
|
||||
.cfi_def_cfa_offset 8
|
||||
ret #36.12
|
||||
.cfi_def_cfa_offset 16
|
||||
# LOE
|
||||
..B1.7: # Preds ..B1.4
|
||||
# Execution count [4.91e-03]: Infreq
|
||||
# fputs(il0_peep_printf_format_1, stderr), then fall through to exit(1).
movl $il0_peep_printf_format_1, %edi #25.13
|
||||
movq stderr(%rip), %rsi #25.13
|
||||
call fputs #25.13
|
||||
# LOE
|
||||
..B1.8: # Preds ..B1.11 ..B1.9 ..B1.7
|
||||
# Execution count [4.91e-03]: Infreq
|
||||
# Shared failure exit for all three error messages.
movl $1, %edi #27.13
|
||||
# exit(int)
|
||||
call exit #27.13
|
||||
# LOE
|
||||
..B1.9: # Preds ..B1.3
|
||||
# Execution count [4.96e-03]: Infreq
|
||||
# fputs(il0_peep_printf_format_2, stderr), then exit(1) via ..B1.8.
movl $il0_peep_printf_format_2, %edi #20.13
|
||||
movq stderr(%rip), %rsi #20.13
|
||||
call fputs #20.13
|
||||
jmp ..B1.8 # Prob 100% #20.13
|
||||
# LOE
|
||||
..B1.11: # Preds ..B1.5
|
||||
# Execution count [1.79e-02]: Infreq
|
||||
# NULL pointer in the slot: fputs(il0_peep_printf_format_0, stderr), then exit(1).
movl $il0_peep_printf_format_0, %edi #32.9
|
||||
movq stderr(%rip), %rsi #32.9
|
||||
call fputs #32.9
|
||||
jmp ..B1.8 # Prob 100% #32.9
|
||||
.align 16,0x90
|
||||
# LOE
|
||||
.cfi_endproc
|
||||
# mark_end;
|
||||
.type allocate,@function
|
||||
.size allocate,.-allocate
|
||||
..LNallocate.0:
|
||||
# Read-only, mergeable string constants used by allocate's error paths.
# Each string is emitted as little-endian .long/.word/.byte chunks of its ASCII bytes.
.section .rodata.str1.4, "aMS",@progbits,1
|
||||
.align 4
|
||||
.align 4
|
||||
# Decodes to: "Error: Insufficient memory to fulfill the request\n"
# (printed when posix_memalign returns 12).
il0_peep_printf_format_1:
|
||||
.long 1869771333
|
||||
.long 1226848882
|
||||
.long 1718973294
|
||||
.long 1768122726
|
||||
.long 544501349
|
||||
.long 1869440365
|
||||
.long 1948285298
|
||||
.long 1969627247
|
||||
.long 1818846828
|
||||
.long 1752440940
|
||||
.long 1701978213
|
||||
.long 1936029041
|
||||
.word 2676
|
||||
.byte 0
|
||||
.space 1, 0x00 # pad
|
||||
.align 4
|
||||
# Decodes to: "Error: Alignment parameter is not a power of two\n"
# (printed when posix_memalign returns 22).
il0_peep_printf_format_2:
|
||||
.long 1869771333
|
||||
.long 1092631154
|
||||
.long 1852270956
|
||||
.long 1953391981
|
||||
.long 1918988320
|
||||
.long 1952804193
|
||||
.long 1763734117
|
||||
.long 1869488243
|
||||
.long 543236212
|
||||
.long 1702326128
|
||||
.long 1718558834
|
||||
.long 1870099488
|
||||
.word 10
|
||||
.space 2, 0x00 # pad
|
||||
.align 4
|
||||
# Decodes to: "Error: posix_memalign failed!\n"
# (printed when the returned pointer is NULL).
il0_peep_printf_format_0:
|
||||
.long 1869771333
|
||||
.long 1881160306
|
||||
.long 2020176751
|
||||
.long 1835363679
|
||||
.long 1734962273
|
||||
.long 1634082926
|
||||
.long 1684368489
|
||||
.word 2593
|
||||
.byte 0
|
||||
.data
|
||||
# -- End allocate
|
||||
.data
|
||||
.section .note.GNU-stack, ""
|
||||
# End
|
321
PoissonSolver/2D-mpi/ICC/main.s
Normal file
321
PoissonSolver/2D-mpi/ICC/main.s
Normal file
@@ -0,0 +1,321 @@
|
||||
# mark_description "Intel(R) C Intel(R) 64 Compiler Classic for applications running on Intel(R) 64, Version 2021.10.0 Build 202";
|
||||
# mark_description "30609_000000";
|
||||
# mark_description "-I./src/includes -I./ICC -I/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-mpi-2021.1";
|
||||
# mark_description "0.0-ki6gcj4pr5rekayazvm4lsmvcyosce25/mpi/2021.10.0/include -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux";
|
||||
# mark_description "8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux";
|
||||
# mark_description "/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-ax";
|
||||
# mark_description "ze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/x64 -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almal";
|
||||
# mark_description "inux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/l";
|
||||
# mark_description "inux/lib/oclfpga/host/linux64/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel";
|
||||
# mark_description "-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/oclfpga/linux64/lib ";
|
||||
# mark_description "-Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7oc";
|
||||
# mark_description "bc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/compiler/lib/intel64_lin -gcc-name=/usr/bin/gcc -gxx-name=";
|
||||
# mark_description "/usr/bin/g++ -S -fverbose-asm -D_GNU_SOURCE -DARRAY_ALIGNMENT=64 -O3 -xHost -qopt-zmm-usage=high -std=c99 -o";
|
||||
# mark_description " ICC/main.s";
|
||||
.file "main.c"
|
||||
.text
|
||||
..TXTST0:
|
||||
.L_2__routine_start_main_0:
|
||||
# -- Begin main
|
||||
.text
|
||||
# mark_begin;
|
||||
.align 16,0x90
|
||||
.globl main
|
||||
# --- main(int, char **)
# Purpose: program entry point. Initialises MPI, reads a parameter file named on
# the command line, sets up a Solver, runs one of three solver routines, reports
# the elapsed time on rank 0 and finalises MPI.
# Compiler-generated (Intel C Compiler Classic), x86-64 AT&T syntax, SysV AMD64 ABI.
#   In:   %edi = argc, %rsi = argv
#   Out:  %eax = 0 on the normal return path
# Frame (offsets from %rsp after the prologue; %rsp is 128-byte aligned there):
#     0(%rsp)   Solver object (also used briefly as MXCSR scratch before MPI_Init)
#    96(%rsp)   Parameter object
#   160(%rsp)   spilled start timestamp (double)
#   168(%rsp)   argv
#   176(%rsp)   rank written by MPI_Comm_rank
#   184(%rsp)   argc
# Callee-saved %r12d carries the solver-variant selector across the calls.
|
||||
main:
|
||||
# parameter 1: %edi
|
||||
||||
# parameter 2: %rsi
|
||||
..B1.1: # Preds ..B1.0
|
||||
# Execution count [1.00e+00]
|
||||
.cfi_startproc
|
||||
..___tag_value_main.1:
|
||||
..L2:
|
||||
#21.1
|
||||
# Prologue: frame pointer in %rbp, stack realigned to 128 bytes, %r12 saved.
pushq %rbp #21.1
|
||||
.cfi_def_cfa_offset 16
|
||||
movq %rsp, %rbp #21.1
|
||||
.cfi_def_cfa 6, 16
|
||||
.cfi_offset 6, -16
|
||||
andq $-128, %rsp #21.1
|
||||
pushq %r12 #21.1
|
||||
subq $248, %rsp #21.1
|
||||
# argc and argv are stored to memory because MPI_Init receives their addresses.
movl %edi, 184(%rsp) #21.1
|
||||
movl $3, %edi #21.1
|
||||
movq %rsi, 168(%rsp) #21.1
|
||||
movq $0x64199d9ffe, %rsi #21.1
|
||||
# NOTE(review): compiler-inserted Intel runtime call, presumably the CPU-feature
# check that accompanies -xHost; the two constants are opaque here.
call __intel_new_feature_proc_init #21.1
|
||||
.cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0x80, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
|
||||
# LOE rbx r13 r14 r15
|
||||
..B1.31: # Preds ..B1.1
|
||||
# Execution count [1.00e+00]
|
||||
# Read-modify-write of MXCSR: 32832 = 0x8040 sets bit 15 (flush-to-zero) and
# bit 6 (denormals-are-zero). The MPI_Init arguments are set up in between.
vstmxcsr (%rsp) #21.1
|
||||
# Default solver variant is 2 unless overridden from argv[2] in ..B1.27.
movl $2, %r12d #23.17
|
||||
lea 184(%rsp), %rdi #30.5
|
||||
orl $32832, (%rsp) #21.1
|
||||
lea 168(%rsp), %rsi #30.5
|
||||
vldmxcsr (%rsp) #21.1
|
||||
..___tag_value_main.7:
|
||||
# MPI_Init(int *, char ***)
|
||||
call MPI_Init #30.5
|
||||
..___tag_value_main.8:
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
..B1.2: # Preds ..B1.31
|
||||
# Execution count [1.00e+00]
|
||||
# 1140850688 = 0x44000000 is the communicator handle; presumably MPI_COMM_WORLD
# in this MPI implementation (TODO confirm against mpi.h).
movl $1140850688, %edi #31.5
|
||||
lea 176(%rsp), %rsi #31.5
|
||||
..___tag_value_main.9:
|
||||
# MPI_Comm_rank(MPI_Comm, int *)
|
||||
call MPI_Comm_rank #31.5
|
||||
..___tag_value_main.10:
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
..B1.3: # Preds ..B1.2
|
||||
# Execution count [1.00e+00]
|
||||
lea 96(%rsp), %rdi #32.5
|
||||
..___tag_value_main.11:
|
||||
# initParameter(Parameter *)
|
||||
call initParameter #32.5
|
||||
..___tag_value_main.12:
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
..B1.4: # Preds ..B1.3
|
||||
# Execution count [1.00e+00]
|
||||
# argc >= 2 means a parameter file was given; otherwise print usage and exit.
cmpl $2, 184(%rsp) #34.16
|
||||
jge ..B1.7 # Prob 50% #34.16
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
..B1.5: # Preds ..B1.4
|
||||
# Execution count [5.00e-01]
|
||||
# printf(.L_2__STRING.0, argv[0]); %eax = 0 because no vector registers carry
# variadic arguments.
movq 168(%rsp), %rax #35.9
|
||||
movl $.L_2__STRING.0, %edi #35.9
|
||||
movq (%rax), %rsi #35.9
|
||||
xorl %eax, %eax #35.9
|
||||
..___tag_value_main.13:
|
||||
# printf(const char *__restrict__, ...)
|
||||
call printf #35.9
|
||||
..___tag_value_main.14:
|
||||
# LOE
|
||||
..B1.6: # Preds ..B1.5
|
||||
# Execution count [5.00e-01]
|
||||
# exit(0) after the usage message; MPI_Finalize is not called on this path.
xorl %edi, %edi #36.9
|
||||
# exit(int)
|
||||
call exit #36.9
|
||||
# LOE
|
||||
..B1.7: # Preds ..B1.4
|
||||
# Execution count [5.00e-01]
|
||||
# readParameter(&params, argv[1])
movq 168(%rsp), %rax #39.5
|
||||
lea 96(%rsp), %rdi #39.5
|
||||
movq 8(%rax), %rsi #39.5
|
||||
..___tag_value_main.15:
|
||||
# readParameter(Parameter *, const char *)
|
||||
call readParameter #39.5
|
||||
..___tag_value_main.16:
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
..B1.8: # Preds ..B1.7
|
||||
# Execution count [5.00e-01]
|
||||
# Exactly three arguments: parse argv[2] as the solver variant (..B1.27).
cmpl $3, 184(%rsp) #40.17
|
||||
je ..B1.27 # Prob 16% #40.17
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
..B1.9: # Preds ..B1.28 ..B1.8
|
||||
# Execution count [5.00e-01]
|
||||
# Only rank 0 prints the parameters.
cmpl $0, 176(%rsp) #44.17
|
||||
jne ..B1.11 # Prob 78% #44.17
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
..B1.10: # Preds ..B1.9
|
||||
# Execution count [1.10e-01]
|
||||
lea 96(%rsp), %rdi #45.9
|
||||
..___tag_value_main.17:
|
||||
# printParameter(Parameter *)
|
||||
call printParameter #45.9
|
||||
..___tag_value_main.18:
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
..B1.11: # Preds ..B1.10 ..B1.9
|
||||
# Execution count [5.00e-01]
|
||||
# initSolver(&solver, &params, 2); the meaning of the constant 2 is not visible here.
movl $2, %edx #48.5
|
||||
lea (%rsp), %rdi #48.5
|
||||
lea 96(%rsp), %rsi #48.5
|
||||
..___tag_value_main.19:
|
||||
# initSolver(Solver *, Parameter *, int)
|
||||
call initSolver #48.5
|
||||
..___tag_value_main.20:
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
..B1.12: # Preds ..B1.11
|
||||
# Execution count [5.00e-01]
|
||||
# Start timestamp; the result arrives in %xmm0 and is spilled to 160(%rsp).
xorl %eax, %eax #50.9
|
||||
..___tag_value_main.21:
|
||||
# getTimeStamp()
|
||||
call getTimeStamp #50.9
|
||||
..___tag_value_main.22:
|
||||
# LOE rbx r13 r14 r15 r12d xmm0
|
||||
..B1.32: # Preds ..B1.12
|
||||
# Execution count [5.00e-01]
|
||||
vmovsd %xmm0, 160(%rsp) #50.9[spill]
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
..B1.13: # Preds ..B1.32
|
||||
# Execution count [5.00e-01]
|
||||
# Dispatch on the variant in %r12d: 1 -> solve, 2 -> solveRB, 3 -> solveRBA;
# any other value runs no solver and goes directly to ..B1.22.
cmpl $1, %r12d #52.13
|
||||
je ..B1.20 # Prob 25% #52.13
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
..B1.14: # Preds ..B1.13
|
||||
# Execution count [3.75e-01]
|
||||
cmpl $2, %r12d #52.13
|
||||
jne ..B1.17 # Prob 66% #52.13
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
..B1.15: # Preds ..B1.14
|
||||
# Execution count [1.25e-01]
|
||||
# Variant 2: announce with puts, then solveRB(&solver).
movl $il0_peep_printf_format_1, %edi #58.9
|
||||
call puts #58.9
|
||||
# LOE rbx r13 r14 r15
|
||||
..B1.16: # Preds ..B1.15
|
||||
# Execution count [1.25e-01]
|
||||
lea (%rsp), %rdi #59.9
|
||||
..___tag_value_main.24:
|
||||
# solveRB(Solver *)
|
||||
call solveRB #59.9
|
||||
..___tag_value_main.25:
|
||||
jmp ..B1.22 # Prob 100% #59.9
|
||||
# LOE rbx r13 r14 r15
|
||||
..B1.17: # Preds ..B1.14
|
||||
# Execution count [2.50e-01]
|
||||
cmpl $3, %r12d #52.13
|
||||
jne ..B1.22 # Prob 50% #52.13
|
||||
# LOE rbx r13 r14 r15
|
||||
..B1.18: # Preds ..B1.17
|
||||
# Execution count [1.25e-01]
|
||||
# Variant 3: announce with puts, then solveRBA(&solver).
movl $il0_peep_printf_format_0, %edi #62.9
|
||||
call puts #62.9
|
||||
# LOE rbx r13 r14 r15
|
||||
..B1.19: # Preds ..B1.18
|
||||
# Execution count [1.25e-01]
|
||||
lea (%rsp), %rdi #63.9
|
||||
..___tag_value_main.26:
|
||||
# solveRBA(Solver *)
|
||||
call solveRBA #63.9
|
||||
..___tag_value_main.27:
|
||||
jmp ..B1.22 # Prob 100% #63.9
|
||||
# LOE rbx r13 r14 r15
|
||||
..B1.20: # Preds ..B1.13
|
||||
# Execution count [1.25e-01]
|
||||
# Variant 1: announce with puts, then solve(&solver).
movl $il0_peep_printf_format_2, %edi #54.9
|
||||
call puts #54.9
|
||||
# LOE rbx r13 r14 r15
|
||||
..B1.21: # Preds ..B1.20
|
||||
# Execution count [1.25e-01]
|
||||
lea (%rsp), %rdi #55.9
|
||||
..___tag_value_main.28:
|
||||
# solve(Solver *)
|
||||
call solve #55.9
|
||||
..___tag_value_main.29:
|
||||
# LOE rbx r13 r14 r15
|
||||
..B1.22: # Preds ..B1.21 ..B1.16 ..B1.19 ..B1.17
|
||||
# Execution count [5.00e-01]
|
||||
# End timestamp in %xmm0; it stays live across the rank check below.
xorl %eax, %eax #68.9
|
||||
..___tag_value_main.30:
|
||||
# getTimeStamp()
|
||||
call getTimeStamp #68.9
|
||||
..___tag_value_main.31:
|
||||
# LOE rbx r13 r14 r15 xmm0
|
||||
..B1.23: # Preds ..B1.22
|
||||
# Execution count [5.00e-01]
|
||||
# Only rank 0 reports the elapsed time.
cmpl $0, 176(%rsp) #70.17
|
||||
jne ..B1.25 # Prob 78% #70.17
|
||||
# LOE rbx r13 r14 r15 xmm0
|
||||
..B1.24: # Preds ..B1.23
|
||||
# Execution count [1.10e-01]
|
||||
# printf(.L_2__STRING.4, end - start); %eax = 1 because one vector register
# (%xmm0) carries a variadic argument.
movl $.L_2__STRING.4, %edi #71.9
|
||||
movl $1, %eax #71.9
|
||||
vsubsd 160(%rsp), %xmm0, %xmm0 #71.9[spill]
|
||||
..___tag_value_main.32:
|
||||
# printf(const char *__restrict__, ...)
|
||||
call printf #71.9
|
||||
..___tag_value_main.33:
|
||||
# LOE rbx r13 r14 r15
|
||||
..B1.25: # Preds ..B1.24 ..B1.23
|
||||
# Execution count [5.00e-01]
|
||||
..___tag_value_main.35:
|
||||
# MPI_Finalize(void)
|
||||
call MPI_Finalize #74.5
|
||||
..___tag_value_main.36:
|
||||
# LOE rbx r13 r14 r15
|
||||
..B1.26: # Preds ..B1.25
|
||||
# Execution count [5.00e-01]
|
||||
# Epilogue: return 0, restore %r12, undo the realignment through %rbp.
xorl %eax, %eax #75.12
|
||||
addq $248, %rsp #75.12
|
||||
.cfi_restore 12
|
||||
popq %r12 #75.12
|
||||
movq %rbp, %rsp #75.12
|
||||
popq %rbp #75.12
|
||||
.cfi_def_cfa 7, 8
|
||||
.cfi_restore 6
|
||||
ret #75.12
|
||||
.cfi_def_cfa 6, 16
|
||||
.cfi_offset 6, -16
|
||||
.cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0x80, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xf8, 0xff, 0xff, 0xff, 0x22
|
||||
# LOE
|
||||
..B1.27: # Preds ..B1.8
|
||||
# Execution count [8.00e-02]: Infreq
|
||||
# Parse argv[2] with the Intel-library atol variant. The argument is placed in
# %rcx rather than %rdi. NOTE(review): this looks like an Intel-internal register
# convention for __intel_sse4_* helpers; confirm before hand-editing.
movq 168(%rsp), %rax #41.19
|
||||
movq 16(%rax), %rcx #41.19
|
||||
..___tag_value_main.43:
|
||||
call *__intel_sse4_atol@GOTPCREL(%rip) #41.19
|
||||
..___tag_value_main.44:
|
||||
# LOE rax rbx r13 r14 r15
|
||||
..B1.28: # Preds ..B1.27
|
||||
# Execution count [8.00e-02]: Infreq
|
||||
# Keep only the low 32 bits of the parsed value as the variant selector.
movl %eax, %r12d #41.19
|
||||
jmp ..B1.9 # Prob 100% #41.19
|
||||
.align 16,0x90
|
||||
# LOE rbx r13 r14 r15 r12d
|
||||
.cfi_endproc
|
||||
# mark_end;
|
||||
.type main,@function
|
||||
.size main,.-main
|
||||
..LNmain.0:
|
||||
# Read-only, mergeable strings that main passes to puts before each solver call.
# Each string is emitted as little-endian .long/.word chunks of its ASCII bytes.
.section .rodata.str1.4, "aMS",@progbits,1
|
||||
.align 4
|
||||
.align 4
|
||||
# Decodes to: "Red-black SOR" (used for solver variant 2).
il0_peep_printf_format_1:
|
||||
.long 761554258
|
||||
.long 1667329122
|
||||
.long 1330847851
|
||||
.word 82
|
||||
.space 2, 0x00 # pad
|
||||
.align 4
|
||||
# Decodes to: "Red-black SOR with acceleration" (used for solver variant 3).
il0_peep_printf_format_0:
|
||||
.long 761554258
|
||||
.long 1667329122
|
||||
.long 1330847851
|
||||
.long 1769414738
|
||||
.long 1629513844
|
||||
.long 1818583907
|
||||
.long 1952543333
|
||||
.long 7237481
|
||||
.align 4
|
||||
# Decodes to: "Plain SOR" (used for solver variant 1).
il0_peep_printf_format_2:
|
||||
.long 1767992400
|
||||
.long 1330847854
|
||||
.word 82
|
||||
.data
|
||||
# -- End main
|
||||
# printf format strings referenced by main, emitted as little-endian .long chunks.
.section .rodata.str1.4, "aMS",@progbits,1
|
||||
.space 2, 0x00 # pad
|
||||
.align 4
|
||||
# Decodes to: "Usage: %s <configFile>\n" (24 bytes including the terminator).
.L_2__STRING.0:
|
||||
.long 1734439765
|
||||
.long 622869093
|
||||
.long 1664884851
|
||||
.long 1768320623
|
||||
.long 1818838631
|
||||
.long 671333
|
||||
.type .L_2__STRING.0,@object
|
||||
.size .L_2__STRING.0,24
|
||||
.align 4
|
||||
# Decodes to: "Solution took %.2fs\n" (21 bytes including the terminator).
.L_2__STRING.4:
|
||||
.long 1970040659
|
||||
.long 1852795252
|
||||
.long 1869575200
|
||||
.long 774185067
|
||||
.long 175334962
|
||||
.byte 0
|
||||
.type .L_2__STRING.4,@object
|
||||
.size .L_2__STRING.4,21
|
||||
.data
|
||||
.section .note.GNU-stack, ""
|
||||
# End
|
817
PoissonSolver/2D-mpi/ICC/parameter.s
Normal file
817
PoissonSolver/2D-mpi/ICC/parameter.s
Normal file
@@ -0,0 +1,817 @@
|
||||
# mark_description "Intel(R) C Intel(R) 64 Compiler Classic for applications running on Intel(R) 64, Version 2021.10.0 Build 202";
|
||||
# mark_description "30609_000000";
|
||||
# mark_description "-I./src/includes -I./ICC -I/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-mpi-2021.1";
|
||||
# mark_description "0.0-ki6gcj4pr5rekayazvm4lsmvcyosce25/mpi/2021.10.0/include -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux";
|
||||
# mark_description "8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux";
|
||||
# mark_description "/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-ax";
|
||||
# mark_description "ze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/x64 -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almal";
|
||||
# mark_description "inux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/l";
|
||||
# mark_description "inux/lib/oclfpga/host/linux64/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel";
|
||||
# mark_description "-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/oclfpga/linux64/lib ";
|
||||
# mark_description "-Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7oc";
|
||||
# mark_description "bc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/compiler/lib/intel64_lin -gcc-name=/usr/bin/gcc -gxx-name=";
|
||||
# mark_description "/usr/bin/g++ -S -fverbose-asm -D_GNU_SOURCE -DARRAY_ALIGNMENT=64 -O3 -xHost -qopt-zmm-usage=high -std=c99 -o";
|
||||
# mark_description " ICC/parameter.s";
|
||||
.file "parameter.c"
|
||||
.text
|
||||
..TXTST0:
|
||||
.L_2__routine_start_readParameter_0:
|
||||
# -- Begin readParameter
|
||||
.text
|
||||
# mark_begin;
|
||||
.align 16,0x90
|
||||
.globl readParameter
|
||||
# --- readParameter(Parameter *, const char *)
|
||||
readParameter:
|
||||
# parameter 1: %rdi
|
||||
# parameter 2: %rsi
|
||||
..B1.1: # Preds ..B1.0
|
||||
# Execution count [1.00e+00]
|
||||
.cfi_startproc
|
||||
..___tag_value_readParameter.1:
|
||||
..L2:
|
||||
#26.60
|
||||
pushq %r12 #26.60
|
||||
.cfi_def_cfa_offset 16
|
||||
.cfi_offset 12, -16
|
||||
pushq %r13 #26.60
|
||||
.cfi_def_cfa_offset 24
|
||||
.cfi_offset 13, -24
|
||||
pushq %r14 #26.60
|
||||
.cfi_def_cfa_offset 32
|
||||
.cfi_offset 14, -32
|
||||
subq $4112, %rsp #26.60
|
||||
.cfi_def_cfa_offset 4144
|
||||
movq %rsi, %r14 #26.60
|
||||
movq %rdi, %r13 #26.60
|
||||
movq %r14, %rdi #27.16
|
||||
movl $.L_2__STRING.0, %esi #27.16
|
||||
# fopen(const char *__restrict__, const char *__restrict__)
|
||||
call fopen #27.16
|
||||
# LOE rax rbx rbp r13 r14 r15
|
||||
..B1.76: # Preds ..B1.1
|
||||
# Execution count [1.00e+00]
|
||||
movq %rax, %r12 #27.16
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.2: # Preds ..B1.76
|
||||
# Execution count [1.00e+00]
|
||||
testq %r12, %r12 #31.9
|
||||
je ..B1.72 # Prob 0% #31.9
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.3: # Preds ..B1.2
|
||||
# Execution count [9.93e-01]
|
||||
movq %r12, %rdi #36.12
|
||||
# feof(FILE *)
|
||||
call feof #36.12
|
||||
# LOE rbx rbp r12 r13 r15 eax
|
||||
..B1.77: # Preds ..B1.3
|
||||
# Execution count [9.93e-01]
|
||||
testl %eax, %eax #36.12
|
||||
jne ..B1.55 # Prob 10% #36.12
|
||||
# LOE rbx rbp r12 r13 r15
|
||||
..B1.4: # Preds ..B1.77
|
||||
# Execution count [8.94e-01]
|
||||
movq %r15, 4096(%rsp) #[spill]
|
||||
.cfi_offset 15, -48
|
||||
# LOE rbx rbp r12 r13
|
||||
..B1.5: # Preds ..B1.96 ..B1.4
|
||||
# Execution count [4.96e+00]
|
||||
movl $4096, %esi #38.9
|
||||
lea (%rsp), %rdi #38.9
|
||||
movq %r12, %rdx #38.9
|
||||
movb $0, (%rdi) #37.9
|
||||
# fgets(char *__restrict__, int, FILE *__restrict__)
|
||||
call fgets #38.9
|
||||
# LOE rbx rbp r12 r13
|
||||
..B1.6: # Preds ..B1.5
|
||||
# Execution count [4.96e+00]
|
||||
xorl %ecx, %ecx #39.13
|
||||
cmpb $0, (%rsp) #39.31
|
||||
je ..B1.25 # Prob 10% #39.31
|
||||
# LOE rbx rbp r12 r13 ecx
|
||||
..B1.7: # Preds ..B1.6
|
||||
# Execution count [5.58e-01]
|
||||
xorl %eax, %eax #39.9
|
||||
# LOE rax rbx rbp r12 r13 ecx
|
||||
..B1.8: # Preds ..B1.23 ..B1.7
|
||||
# Execution count [1.62e+00]
|
||||
incq %rax #39.9
|
||||
cmpb $35, -8(%rsp,%rax,8) #39.50
|
||||
je ..B1.25 # Prob 20% #39.50
|
||||
# LOE rax rbx rbp r12 r13 ecx
|
||||
..B1.9: # Preds ..B1.8
|
||||
# Execution count [1.30e+00]
|
||||
movl %eax, %r8d #39.55
|
||||
movb -7(%rsp,%rax,8), %sil #39.20
|
||||
lea (,%r8,8), %r9d #39.55
|
||||
lea -7(,%r8,8), %ecx #39.55
|
||||
testb %sil, %sil #39.31
|
||||
je ..B1.25 # Prob 18% #39.31
|
||||
# LOE rax rbx rbp r12 r13 ecx r8d r9d sil
|
||||
..B1.10: # Preds ..B1.9
|
||||
# Execution count [0.00e+00]
|
||||
cmpb $35, %sil #39.50
|
||||
je ..B1.25 # Prob 20% #39.50
|
||||
# LOE rax rbx rbp r12 r13 ecx r8d r9d
|
||||
..B1.11: # Preds ..B1.10
|
||||
# Execution count [1.30e+00]
|
||||
movb -6(%rsp,%rax,8), %sil #39.20
|
||||
lea -6(,%r8,8), %ecx #39.55
|
||||
testb %sil, %sil #39.31
|
||||
je ..B1.25 # Prob 18% #39.31
|
||||
# LOE rax rbx rbp r12 r13 ecx r8d r9d sil
|
||||
..B1.12: # Preds ..B1.11
|
||||
# Execution count [0.00e+00]
|
||||
cmpb $35, %sil #39.50
|
||||
je ..B1.25 # Prob 20% #39.50
|
||||
# LOE rax rbx rbp r12 r13 ecx r8d r9d
|
||||
..B1.13: # Preds ..B1.12
|
||||
# Execution count [1.30e+00]
|
||||
movb -5(%rsp,%rax,8), %sil #39.20
|
||||
lea -5(,%r8,8), %ecx #39.55
|
||||
testb %sil, %sil #39.31
|
||||
je ..B1.25 # Prob 18% #39.31
|
||||
# LOE rax rbx rbp r12 r13 ecx r8d r9d sil
|
||||
..B1.14: # Preds ..B1.13
|
||||
# Execution count [0.00e+00]
|
||||
cmpb $35, %sil #39.50
|
||||
je ..B1.25 # Prob 20% #39.50
|
||||
# LOE rax rbx rbp r12 r13 ecx r8d r9d
|
||||
..B1.15: # Preds ..B1.14
|
||||
# Execution count [1.30e+00]
|
||||
movb -4(%rsp,%rax,8), %sil #39.20
|
||||
lea -4(,%r8,8), %ecx #39.55
|
||||
testb %sil, %sil #39.31
|
||||
je ..B1.25 # Prob 18% #39.31
|
||||
# LOE rax rbx rbp r12 r13 ecx r8d r9d sil
|
||||
..B1.16: # Preds ..B1.15
|
||||
# Execution count [0.00e+00]
|
||||
cmpb $35, %sil #39.50
|
||||
je ..B1.25 # Prob 20% #39.50
|
||||
# LOE rax rbx rbp r12 r13 ecx r8d r9d
|
||||
..B1.17: # Preds ..B1.16
|
||||
# Execution count [1.30e+00]
|
||||
movb -3(%rsp,%rax,8), %sil #39.20
|
||||
lea -3(,%r8,8), %ecx #39.55
|
||||
testb %sil, %sil #39.31
|
||||
je ..B1.25 # Prob 18% #39.31
|
||||
# LOE rax rbx rbp r12 r13 ecx r8d r9d sil
|
||||
..B1.18: # Preds ..B1.17
|
||||
# Execution count [0.00e+00]
|
||||
cmpb $35, %sil #39.50
|
||||
je ..B1.25 # Prob 20% #39.50
|
||||
# LOE rax rbx rbp r12 r13 ecx r8d r9d
|
||||
..B1.19: # Preds ..B1.18
|
||||
# Execution count [1.30e+00]
|
||||
movb -2(%rsp,%rax,8), %sil #39.20
|
||||
lea -2(,%r8,8), %ecx #39.55
|
||||
testb %sil, %sil #39.31
|
||||
je ..B1.25 # Prob 18% #39.31
|
||||
# LOE rax rbx rbp r12 r13 ecx r8d r9d sil
|
||||
..B1.20: # Preds ..B1.19
|
||||
# Execution count [0.00e+00]
|
||||
cmpb $35, %sil #39.50
|
||||
je ..B1.25 # Prob 20% #39.50
|
||||
# LOE rax rbx rbp r12 r13 ecx r8d r9d
|
||||
..B1.21: # Preds ..B1.20
|
||||
# Execution count [1.30e+00]
|
||||
movb -1(%rsp,%rax,8), %sil #39.20
|
||||
lea -1(,%r8,8), %ecx #39.55
|
||||
testb %sil, %sil #39.31
|
||||
je ..B1.25 # Prob 18% #39.31
|
||||
# LOE rax rbx rbp r12 r13 ecx r9d sil
|
||||
..B1.22: # Preds ..B1.21
|
||||
# Execution count [0.00e+00]
|
||||
cmpb $35, %sil #39.50
|
||||
je ..B1.25 # Prob 20% #39.50
|
||||
# LOE rax rbx rbp r12 r13 ecx r9d
|
||||
..B1.23: # Preds ..B1.22
|
||||
# Execution count [1.30e+00]
|
||||
movl %r9d, %ecx #39.55
|
||||
cmpb $0, (%rsp,%rax,8) #39.31
|
||||
jne ..B1.8 # Prob 82% #39.31
|
||||
# LOE rax rbx rbp r12 r13 ecx
|
||||
..B1.25: # Preds ..B1.21 ..B1.22 ..B1.20 ..B1.19 ..B1.18
|
||||
# ..B1.17 ..B1.16 ..B1.15 ..B1.14 ..B1.13
|
||||
# ..B1.12 ..B1.11 ..B1.10 ..B1.9 ..B1.8
|
||||
# ..B1.23 ..B1.6
|
||||
# Execution count [4.96e+00]
|
||||
movslq %ecx, %rcx #40.9
|
||||
movl $.L_2__STRING.2, %edx #42.21
|
||||
movb $0, (%rsp,%rcx) #40.9
|
||||
lea (%rsp), %rcx #42.21
|
||||
..___tag_value_readParameter.12:
|
||||
call *__intel_sse4_strtok@GOTPCREL(%rip) #42.21
|
||||
..___tag_value_readParameter.13:
|
||||
# LOE rax rbx rbp r12 r13
|
||||
..B1.78: # Preds ..B1.25
|
||||
# Execution count [4.96e+00]
|
||||
movq %rax, %r14 #42.21
|
||||
# LOE rbx rbp r12 r13 r14
|
||||
..B1.26: # Preds ..B1.78
|
||||
# Execution count [4.96e+00]
|
||||
xorl %ecx, %ecx #43.21
|
||||
movl $.L_2__STRING.2, %edx #43.21
|
||||
..___tag_value_readParameter.14:
|
||||
call *__intel_sse4_strtok@GOTPCREL(%rip) #43.21
|
||||
..___tag_value_readParameter.15:
|
||||
# LOE rax rbx rbp r12 r13 r14
|
||||
..B1.79: # Preds ..B1.26
|
||||
# Execution count [4.96e+00]
|
||||
movq %rax, %r15 #43.21
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.27: # Preds ..B1.79
|
||||
# Execution count [4.96e+00]
|
||||
testq %r14, %r14 #50.19
|
||||
je ..B1.53 # Prob 12% #50.19
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.28: # Preds ..B1.27
|
||||
# Execution count [4.37e+00]
|
||||
testq %r15, %r15 #50.34
|
||||
je ..B1.53 # Prob 12% #50.34
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.29: # Preds ..B1.28
|
||||
# Execution count [3.84e+00]
|
||||
movq %r14, %rax #51.13
|
||||
movl $.L_2__STRING.3, %ecx #51.13
|
||||
movl $7, %edx #51.13
|
||||
..___tag_value_readParameter.16:
|
||||
call *__intel_sse4_strncmp@GOTPCREL(%rip) #51.13
|
||||
..___tag_value_readParameter.17:
|
||||
# LOE rbx rbp r12 r13 r14 r15 eax
|
||||
..B1.80: # Preds ..B1.29
|
||||
# Execution count [3.84e+00]
|
||||
testl %eax, %eax #51.13
|
||||
jne ..B1.32 # Prob 50% #51.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.30: # Preds ..B1.80
|
||||
# Execution count [1.92e+00]
|
||||
movq %r15, %rdi #51.13
|
||||
xorl %esi, %esi #51.13
|
||||
# strtod(const char *__restrict__, char **__restrict__)
|
||||
call strtod #51.13
|
||||
# LOE rbx rbp r12 r13 r14 r15 xmm0
|
||||
..B1.31: # Preds ..B1.30
|
||||
# Execution count [1.92e+00]
|
||||
vmovsd %xmm0, (%r13) #51.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.32: # Preds ..B1.80 ..B1.31
|
||||
# Execution count [3.84e+00]
|
||||
movq %r14, %rax #52.13
|
||||
movl $.L_2__STRING.4, %ecx #52.13
|
||||
movl $7, %edx #52.13
|
||||
..___tag_value_readParameter.18:
|
||||
call *__intel_sse4_strncmp@GOTPCREL(%rip) #52.13
|
||||
..___tag_value_readParameter.19:
|
||||
# LOE rbx rbp r12 r13 r14 r15 eax
|
||||
..B1.82: # Preds ..B1.32
|
||||
# Execution count [3.84e+00]
|
||||
testl %eax, %eax #52.13
|
||||
jne ..B1.35 # Prob 50% #52.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.33: # Preds ..B1.82
|
||||
# Execution count [1.92e+00]
|
||||
movq %r15, %rdi #52.13
|
||||
xorl %esi, %esi #52.13
|
||||
# strtod(const char *__restrict__, char **__restrict__)
|
||||
call strtod #52.13
|
||||
# LOE rbx rbp r12 r13 r14 r15 xmm0
|
||||
..B1.34: # Preds ..B1.33
|
||||
# Execution count [1.92e+00]
|
||||
vmovsd %xmm0, 8(%r13) #52.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.35: # Preds ..B1.82 ..B1.34
|
||||
# Execution count [3.84e+00]
|
||||
movq %r14, %rax #53.13
|
||||
movl $.L_2__STRING.5, %ecx #53.13
|
||||
movl $4, %edx #53.13
|
||||
..___tag_value_readParameter.20:
|
||||
call *__intel_sse4_strncmp@GOTPCREL(%rip) #53.13
|
||||
..___tag_value_readParameter.21:
|
||||
# LOE rbx rbp r12 r13 r14 r15 eax
|
||||
..B1.84: # Preds ..B1.35
|
||||
# Execution count [3.84e+00]
|
||||
testl %eax, %eax #53.13
|
||||
jne ..B1.38 # Prob 50% #53.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.36: # Preds ..B1.84
|
||||
# Execution count [1.92e+00]
|
||||
movq %r15, %rcx #53.13
|
||||
..___tag_value_readParameter.22:
|
||||
call *__intel_sse4_atol@GOTPCREL(%rip) #53.13
|
||||
..___tag_value_readParameter.23:
|
||||
# LOE rax rbx rbp r12 r13 r14 r15
|
||||
..B1.37: # Preds ..B1.36
|
||||
# Execution count [1.92e+00]
|
||||
movl %eax, 16(%r13) #53.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.38: # Preds ..B1.84 ..B1.37
|
||||
# Execution count [3.84e+00]
|
||||
movq %r14, %rax #54.13
|
||||
movl $.L_2__STRING.6, %ecx #54.13
|
||||
movl $4, %edx #54.13
|
||||
..___tag_value_readParameter.24:
|
||||
call *__intel_sse4_strncmp@GOTPCREL(%rip) #54.13
|
||||
..___tag_value_readParameter.25:
|
||||
# LOE rbx rbp r12 r13 r14 r15 eax
|
||||
..B1.86: # Preds ..B1.38
|
||||
# Execution count [3.84e+00]
|
||||
testl %eax, %eax #54.13
|
||||
jne ..B1.41 # Prob 50% #54.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.39: # Preds ..B1.86
|
||||
# Execution count [1.92e+00]
|
||||
movq %r15, %rcx #54.13
|
||||
..___tag_value_readParameter.26:
|
||||
call *__intel_sse4_atol@GOTPCREL(%rip) #54.13
|
||||
..___tag_value_readParameter.27:
|
||||
# LOE rax rbx rbp r12 r13 r14 r15
|
||||
..B1.40: # Preds ..B1.39
|
||||
# Execution count [1.92e+00]
|
||||
movl %eax, 20(%r13) #54.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.41: # Preds ..B1.86 ..B1.40
|
||||
# Execution count [3.84e+00]
|
||||
movq %r14, %rax #55.13
|
||||
movl $.L_2__STRING.7, %ecx #55.13
|
||||
movl $7, %edx #55.13
|
||||
..___tag_value_readParameter.28:
|
||||
call *__intel_sse4_strncmp@GOTPCREL(%rip) #55.13
|
||||
..___tag_value_readParameter.29:
|
||||
# LOE rbx rbp r12 r13 r14 r15 eax
|
||||
..B1.88: # Preds ..B1.41
|
||||
# Execution count [3.84e+00]
|
||||
testl %eax, %eax #55.13
|
||||
jne ..B1.44 # Prob 50% #55.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.42: # Preds ..B1.88
|
||||
# Execution count [1.92e+00]
|
||||
movq %r15, %rcx #55.13
|
||||
..___tag_value_readParameter.30:
|
||||
call *__intel_sse4_atol@GOTPCREL(%rip) #55.13
|
||||
..___tag_value_readParameter.31:
|
||||
# LOE rax rbx rbp r12 r13 r14 r15
|
||||
..B1.43: # Preds ..B1.42
|
||||
# Execution count [1.92e+00]
|
||||
movl %eax, 24(%r13) #55.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.44: # Preds ..B1.88 ..B1.43
|
||||
# Execution count [3.84e+00]
|
||||
movq %r14, %rax #56.13
|
||||
movl $.L_2__STRING.8, %ecx #56.13
|
||||
movl $3, %edx #56.13
|
||||
..___tag_value_readParameter.32:
|
||||
call *__intel_sse4_strncmp@GOTPCREL(%rip) #56.13
|
||||
..___tag_value_readParameter.33:
|
||||
# LOE rbx rbp r12 r13 r14 r15 eax
|
||||
..B1.90: # Preds ..B1.44
|
||||
# Execution count [3.84e+00]
|
||||
testl %eax, %eax #56.13
|
||||
jne ..B1.47 # Prob 50% #56.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.45: # Preds ..B1.90
|
||||
# Execution count [1.92e+00]
|
||||
movq %r15, %rdi #56.13
|
||||
xorl %esi, %esi #56.13
|
||||
# strtod(const char *__restrict__, char **__restrict__)
|
||||
call strtod #56.13
|
||||
# LOE rbx rbp r12 r13 r14 r15 xmm0
|
||||
..B1.46: # Preds ..B1.45
|
||||
# Execution count [1.92e+00]
|
||||
vmovsd %xmm0, 32(%r13) #56.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.47: # Preds ..B1.90 ..B1.46
|
||||
# Execution count [3.84e+00]
|
||||
movq %r14, %rax #57.13
|
||||
movl $.L_2__STRING.9, %ecx #57.13
|
||||
movl $3, %edx #57.13
|
||||
..___tag_value_readParameter.34:
|
||||
call *__intel_sse4_strncmp@GOTPCREL(%rip) #57.13
|
||||
..___tag_value_readParameter.35:
|
||||
# LOE rbx rbp r12 r13 r14 r15 eax
|
||||
..B1.92: # Preds ..B1.47
|
||||
# Execution count [3.84e+00]
|
||||
testl %eax, %eax #57.13
|
||||
jne ..B1.50 # Prob 50% #57.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.48: # Preds ..B1.92
|
||||
# Execution count [1.92e+00]
|
||||
movq %r15, %rdi #57.13
|
||||
xorl %esi, %esi #57.13
|
||||
# strtod(const char *__restrict__, char **__restrict__)
|
||||
call strtod #57.13
|
||||
# LOE rbx rbp r12 r13 r14 r15 xmm0
|
||||
..B1.49: # Preds ..B1.48
|
||||
# Execution count [1.92e+00]
|
||||
vmovsd %xmm0, 40(%r13) #57.13
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.50: # Preds ..B1.92 ..B1.49
|
||||
# Execution count [3.84e+00]
|
||||
movq %r14, %rax #58.13
|
||||
movl $.L_2__STRING.10, %ecx #58.13
|
||||
movl $3, %edx #58.13
|
||||
..___tag_value_readParameter.36:
|
||||
call *__intel_sse4_strncmp@GOTPCREL(%rip) #58.13
|
||||
..___tag_value_readParameter.37:
|
||||
# LOE rbx rbp r12 r13 r15 eax
|
||||
..B1.94: # Preds ..B1.50
|
||||
# Execution count [3.84e+00]
|
||||
testl %eax, %eax #58.13
|
||||
jne ..B1.53 # Prob 50% #58.13
|
||||
# LOE rbx rbp r12 r13 r15
|
||||
..B1.51: # Preds ..B1.94
|
||||
# Execution count [1.92e+00]
|
||||
movq %r15, %rdi #58.13
|
||||
xorl %esi, %esi #58.13
|
||||
# strtod(const char *__restrict__, char **__restrict__)
|
||||
call strtod #58.13
|
||||
# LOE rbx rbp r12 r13 xmm0
|
||||
..B1.52: # Preds ..B1.51
|
||||
# Execution count [1.92e+00]
|
||||
vmovsd %xmm0, 56(%r13) #58.13
|
||||
# LOE rbx rbp r12 r13
|
||||
..B1.53: # Preds ..B1.94 ..B1.28 ..B1.27 ..B1.52
|
||||
# Execution count [4.96e+00]
|
||||
movq %r12, %rdi #36.12
|
||||
# feof(FILE *)
|
||||
call feof #36.12
|
||||
# LOE rbx rbp r12 r13 eax
|
||||
..B1.96: # Preds ..B1.53
|
||||
# Execution count [4.96e+00]
|
||||
testl %eax, %eax #36.12
|
||||
je ..B1.5 # Prob 82% #36.12
|
||||
# LOE rbx rbp r12 r13
|
||||
..B1.54: # Preds ..B1.96
|
||||
# Execution count [8.94e-01]
|
||||
movq 4096(%rsp), %r15 #[spill]
|
||||
.cfi_restore 15
|
||||
# LOE rbx rbp r12 r15
|
||||
..B1.55: # Preds ..B1.54 ..B1.77
|
||||
# Execution count [9.93e-01]
|
||||
movq %r12, %rdi #63.5
|
||||
# fclose(FILE *)
|
||||
call fclose #63.5
|
||||
# LOE rbx rbp r15
|
||||
..B1.56: # Preds ..B1.55
|
||||
# Execution count [9.93e-01]
|
||||
addq $4112, %rsp #64.1
|
||||
.cfi_def_cfa_offset 32
|
||||
.cfi_restore 14
|
||||
popq %r14 #64.1
|
||||
.cfi_def_cfa_offset 24
|
||||
.cfi_restore 13
|
||||
popq %r13 #64.1
|
||||
.cfi_def_cfa_offset 16
|
||||
.cfi_restore 12
|
||||
popq %r12 #64.1
|
||||
.cfi_def_cfa_offset 8
|
||||
ret #64.1
|
||||
.cfi_def_cfa_offset 4144
|
||||
.cfi_offset 12, -16
|
||||
.cfi_offset 13, -24
|
||||
.cfi_offset 14, -32
|
||||
# LOE
|
||||
..B1.72: # Preds ..B1.2
|
||||
# Execution count [7.13e-03]: Infreq
|
||||
movl $.L_2__STRING.1, %esi #32.9
|
||||
movq %r14, %rdx #32.9
|
||||
xorl %eax, %eax #32.9
|
||||
movq stderr(%rip), %rdi #32.9
|
||||
# fprintf(FILE *__restrict__, const char *__restrict__, ...)
|
||||
call fprintf #32.9
|
||||
# LOE
|
||||
..B1.73: # Preds ..B1.72
|
||||
# Execution count [7.13e-03]: Infreq
|
||||
movl $1, %edi #33.9
|
||||
# exit(int)
|
||||
call exit #33.9
|
||||
.align 16,0x90
|
||||
# LOE
|
||||
.cfi_endproc
|
||||
# mark_end;
|
||||
.type readParameter,@function
|
||||
.size readParameter,.-readParameter
|
||||
..LNreadParameter.0:
|
||||
.data
|
||||
# -- End readParameter
|
||||
.text
|
||||
.L_2__routine_start_printParameter_1:
|
||||
# -- Begin printParameter
|
||||
.text
|
||||
# mark_begin;
|
||||
.align 16,0x90
|
||||
.globl printParameter
|
||||
# --- printParameter(Parameter *)
|
||||
# ---------------------------------------------------------------------
# printParameter(Parameter *)  -- compiler-generated, AT&T syntax, SysV AMD64
# Prints a human-readable summary of the record passed in %rdi.
# In:    %rdi = pointer to the record (copied to %r14 so it survives calls)
# Reads: doubles at offsets 0, 8, 32, 40; 32-bit ints at offsets 16, 20, 24
# Calls: puts (3x), printf (4x, plus a final tail jump to printf)
# Stack: a single push of %r14; with the return address this keeps %rsp
#        16-byte aligned at every call site
# Note:  the double at offset 56 (written by readParameter/initParameter)
#        is not printed by this routine.
# NOTE(review): string addresses are loaded with `movl $sym, %edi`
#        (32-bit absolute), so this presumably targets a non-PIE link.
# ---------------------------------------------------------------------
printParameter:
|
||||
# parameter 1: %rdi
|
||||
..B2.1: # Preds ..B2.0
|
||||
# Execution count [1.00e+00]
|
||||
.cfi_startproc
|
||||
..___tag_value_printParameter.51:
|
||||
..L52:
|
||||
#66.39
|
||||
# Save callee-saved %r14; it will hold the record pointer for the whole body.
pushq %r14 #66.39
|
||||
.cfi_def_cfa_offset 16
|
||||
.cfi_offset 14, -16
|
||||
movq %rdi, %r14 #66.39
|
||||
# puts("Parameters:") -- string stored at il0_peep_printf_format_0
movl $il0_peep_printf_format_0, %edi #67.5
|
||||
call puts #67.5
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B2.2: # Preds ..B2.1
|
||||
# Execution count [1.00e+00]
|
||||
# puts("Geometry data:") -- string stored at il0_peep_printf_format_1
movl $il0_peep_printf_format_1, %edi #68.5
|
||||
call puts #68.5
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B2.3: # Preds ..B2.2
|
||||
# Execution count [1.00e+00]
|
||||
# printf("\tDomain box size (x, y): %e, %e\n", [r14+0], [r14+8])
vmovsd (%r14), %xmm0 #69.5
|
||||
movl $.L_2__STRING.13, %edi #69.5
|
||||
vmovsd 8(%r14), %xmm1 #69.5
|
||||
# Variadic call: %al = number of vector registers carrying arguments (2).
movl $2, %eax #69.5
|
||||
..___tag_value_printParameter.55:
|
||||
# printf(const char *__restrict__, ...)
|
||||
call printf #69.5
|
||||
..___tag_value_printParameter.56:
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B2.4: # Preds ..B2.3
|
||||
# Execution count [1.00e+00]
|
||||
# printf("\tCells (x, y): %d, %d\n", [r14+16], [r14+20])
movl $.L_2__STRING.14, %edi #70.5
|
||||
# No floating-point arguments, so %al = 0.
xorl %eax, %eax #70.5
|
||||
movl 16(%r14), %esi #70.5
|
||||
movl 20(%r14), %edx #70.5
|
||||
..___tag_value_printParameter.57:
|
||||
# printf(const char *__restrict__, ...)
|
||||
call printf #70.5
|
||||
..___tag_value_printParameter.58:
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B2.5: # Preds ..B2.4
|
||||
# Execution count [1.00e+00]
|
||||
# puts("Iterative solver parameters:") -- stored at il0_peep_printf_format_2
movl $il0_peep_printf_format_2, %edi #71.5
|
||||
call puts #71.5
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B2.6: # Preds ..B2.5
|
||||
# Execution count [1.00e+00]
|
||||
# printf("\tMax iterations: %d\n", [r14+24])
movl $.L_2__STRING.16, %edi #72.5
|
||||
xorl %eax, %eax #72.5
|
||||
movl 24(%r14), %esi #72.5
|
||||
..___tag_value_printParameter.59:
|
||||
# printf(const char *__restrict__, ...)
|
||||
call printf #72.5
|
||||
..___tag_value_printParameter.60:
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B2.7: # Preds ..B2.6
|
||||
# Execution count [1.00e+00]
|
||||
# printf("\tepsilon (stopping tolerance) : %e\n", [r14+32])
vmovsd 32(%r14), %xmm0 #73.5
|
||||
movl $.L_2__STRING.17, %edi #73.5
|
||||
# One vector register carries an argument, so %al = 1.
movl $1, %eax #73.5
|
||||
..___tag_value_printParameter.61:
|
||||
# printf(const char *__restrict__, ...)
|
||||
call printf #73.5
|
||||
..___tag_value_printParameter.62:
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B2.8: # Preds ..B2.7
|
||||
# Execution count [1.00e+00]
|
||||
# printf("\tomega (SOR relaxation): %e\n", [r14+40]) issued as a tail call:
# the argument is loaded while %r14 is still valid, then %r14 is restored
# and control jumps to printf, which returns straight to our caller.
vmovsd 40(%r14), %xmm0 #74.5
|
||||
movl $.L_2__STRING.18, %edi #74.5
|
||||
movl $1, %eax #74.5
|
||||
.cfi_restore 14
|
||||
popq %r14 #74.5
|
||||
.cfi_def_cfa_offset 8
|
||||
# printf(const char *__restrict__, ...)
|
||||
jmp printf #74.5
|
||||
.align 16,0x90
|
||||
# LOE
|
||||
.cfi_endproc
|
||||
# mark_end;
|
||||
.type printParameter,@function
|
||||
.size printParameter,.-printParameter
|
||||
..LNprintParameter.1:
|
||||
# NUL-terminated strings passed to puts by printParameter. The compiler emits
# them as little-endian integers; the decoded ASCII text is given per label.
.section .rodata.str1.4, "aMS",@progbits,1
|
||||
.align 4
|
||||
.align 4
|
||||
# "Parameters:"
il0_peep_printf_format_0:
|
||||
.long 1634885968
|
||||
.long 1702126957
|
||||
.long 3830642
|
||||
.align 4
|
||||
# "Geometry data:"
il0_peep_printf_format_1:
|
||||
.long 1836016967
|
||||
.long 2037544037
|
||||
.long 1952539680
|
||||
.word 14945
|
||||
.byte 0
|
||||
.space 1, 0x00 # pad
|
||||
.align 4
|
||||
# "Iterative solver parameters:"
il0_peep_printf_format_2:
|
||||
.long 1919251529
|
||||
.long 1986622561
|
||||
.long 1869815909
|
||||
.long 1919252076
|
||||
.long 1918988320
|
||||
.long 1952804193
|
||||
.long 980644453
|
||||
.byte 0
|
||||
.data
|
||||
# -- End printParameter
|
||||
.text
|
||||
.L_2__routine_start_initParameter_2:
|
||||
# -- Begin initParameter
|
||||
.text
|
||||
# mark_begin;
|
||||
.align 16,0x90
|
||||
.globl initParameter
|
||||
# --- initParameter(Parameter *)
|
||||
# ---------------------------------------------------------------------
# initParameter(Parameter *)  -- compiler-generated, AT&T syntax, SysV AMD64
# Fills the record at %rdi with default values. Leaf routine: no calls,
# no stack use.
# In:    %rdi = pointer to the record
# Clobb: %rax, %rcx, %rdx, %rsi, %r8 (all caller-saved)
# Defaults written (config keys taken from the strings readParameter
# compares against before storing to the same offsets):
#   +0   double 1.0    printed by printParameter as domain box size x
#   +8   double 1.0    printed by printParameter as domain box size y
#   +16  int    100    "imax"
#   +20  int    100    "jmax"
#   +24  int    1000   "itermax"
#   +32  double 1e-4   "eps"
#   +40  double 1.8    "omg"
#   +56  double 0.99   "rho"
# NOTE(review): nothing is stored at offset 48 (nor the 4 bytes at 28);
# confirm against the struct definition whether a field there needs a default.
# ---------------------------------------------------------------------
initParameter:
|
||||
# parameter 1: %rdi
|
||||
..B3.1: # Preds ..B3.0
|
||||
# Execution count [1.00e+00]
|
||||
.cfi_startproc
|
||||
..___tag_value_initParameter.66:
|
||||
..L67:
|
||||
#15.38
|
||||
# Materialise the constants first; doubles are moved as raw IEEE-754 bit
# patterns through integer registers.
# 0x3ff0000000000000 = 1.0
movq $0x3ff0000000000000, %rax #16.5
|
||||
movl $100, %edx #18.5
|
||||
# 0x3f1a36e2eb1c432d = 1e-4
movq $0x3f1a36e2eb1c432d, %rcx #21.18
|
||||
# 0x3ffccccccccccccd = 1.8
movq $0x3ffccccccccccccd, %rsi #22.18
|
||||
# 0x3fefae147ae147ae = 0.99
movq $0x3fefae147ae147ae, %r8 #23.22
|
||||
# Store the defaults into the record.
movq %rax, (%rdi) #16.5
|
||||
movq %rax, 8(%rdi) #17.5
|
||||
movl %edx, 16(%rdi) #18.5
|
||||
movl %edx, 20(%rdi) #19.5
|
||||
movl $1000, 24(%rdi) #20.5
|
||||
movq %rcx, 32(%rdi) #21.5
|
||||
movq %rsi, 40(%rdi) #22.5
|
||||
movq %r8, 56(%rdi) #23.5
|
||||
ret #24.1
|
||||
.align 16,0x90
|
||||
# LOE
|
||||
.cfi_endproc
|
||||
# mark_end;
|
||||
.type initParameter,@function
|
||||
.size initParameter,.-initParameter
|
||||
..LNinitParameter.2:
|
||||
.data
|
||||
# -- End initParameter
|
||||
# 8-byte double constants, each emitted as two 32-bit halves (low word first).
# The same bit patterns appear as immediates in initParameter.
.section .rodata, "a"
|
||||
.align 8
|
||||
.align 8
|
||||
# 0x3f1a36e2eb1c432d = 1e-4
.L_2il0floatpacket.0:
|
||||
.long 0xeb1c432d,0x3f1a36e2
|
||||
.type .L_2il0floatpacket.0,@object
|
||||
.size .L_2il0floatpacket.0,8
|
||||
.align 8
|
||||
# 0x3ffccccccccccccd = 1.8
.L_2il0floatpacket.1:
|
||||
.long 0xcccccccd,0x3ffccccc
|
||||
.type .L_2il0floatpacket.1,@object
|
||||
.size .L_2il0floatpacket.1,8
|
||||
.align 8
|
||||
# 0x3fefae147ae147ae = 0.99
.L_2il0floatpacket.2:
|
||||
.long 0x7ae147ae,0x3fefae14
|
||||
.type .L_2il0floatpacket.2,@object
|
||||
.size .L_2il0floatpacket.2,8
|
||||
.align 8
|
||||
# 0x3ff0000000000000 = 1.0
.L_2il0floatpacket.3:
|
||||
.long 0x00000000,0x3ff00000
|
||||
.type .L_2il0floatpacket.3,@object
|
||||
.size .L_2il0floatpacket.3,8
|
||||
# NUL-terminated string literals of the parameter routines. The compiler emits
# them as little-endian integers; the decoded ASCII text is given per label.
.section .rodata.str1.4, "aMS",@progbits,1
|
||||
.space 3, 0x00 # pad
|
||||
.align 4
|
||||
# "r"
.L_2__STRING.0:
|
||||
.word 114
|
||||
.type .L_2__STRING.0,@object
|
||||
.size .L_2__STRING.0,2
|
||||
.space 2, 0x00 # pad
|
||||
.align 4
|
||||
# " " (a single space)
.L_2__STRING.2:
|
||||
.word 32
|
||||
.type .L_2__STRING.2,@object
|
||||
.size .L_2__STRING.2,2
|
||||
.space 2, 0x00 # pad
|
||||
.align 4
|
||||
# "xlength"
.L_2__STRING.3:
|
||||
.long 1852140664
|
||||
.long 6845543
|
||||
.type .L_2__STRING.3,@object
|
||||
.size .L_2__STRING.3,8
|
||||
.align 4
|
||||
# "ylength"
.L_2__STRING.4:
|
||||
.long 1852140665
|
||||
.long 6845543
|
||||
.type .L_2__STRING.4,@object
|
||||
.size .L_2__STRING.4,8
|
||||
.align 4
|
||||
# "imax"
.L_2__STRING.5:
|
||||
.long 2019650921
|
||||
.byte 0
|
||||
.type .L_2__STRING.5,@object
|
||||
.size .L_2__STRING.5,5
|
||||
.space 3, 0x00 # pad
|
||||
.align 4
|
||||
# "jmax"
.L_2__STRING.6:
|
||||
.long 2019650922
|
||||
.byte 0
|
||||
.type .L_2__STRING.6,@object
|
||||
.size .L_2__STRING.6,5
|
||||
.space 3, 0x00 # pad
|
||||
.align 4
|
||||
# "itermax"
.L_2__STRING.7:
|
||||
.long 1919251561
|
||||
.long 7889261
|
||||
.type .L_2__STRING.7,@object
|
||||
.size .L_2__STRING.7,8
|
||||
.align 4
|
||||
# "eps"
.L_2__STRING.8:
|
||||
.long 7565413
|
||||
.type .L_2__STRING.8,@object
|
||||
.size .L_2__STRING.8,4
|
||||
.align 4
|
||||
# "omg"
.L_2__STRING.9:
|
||||
.long 6778223
|
||||
.type .L_2__STRING.9,@object
|
||||
.size .L_2__STRING.9,4
|
||||
.align 4
|
||||
# "rho"
.L_2__STRING.10:
|
||||
.long 7301234
|
||||
.type .L_2__STRING.10,@object
|
||||
.size .L_2__STRING.10,4
|
||||
.align 4
|
||||
# "Could not open parameter file: %s\n"
.L_2__STRING.1:
|
||||
.long 1819635523
|
||||
.long 1869488228
|
||||
.long 1886330996
|
||||
.long 1881173605
|
||||
.long 1835102817
|
||||
.long 1919251557
|
||||
.long 1818846752
|
||||
.long 622869093
|
||||
.word 2675
|
||||
.byte 0
|
||||
.type .L_2__STRING.1,@object
|
||||
.size .L_2__STRING.1,35
|
||||
.space 1, 0x00 # pad
|
||||
.align 4
|
||||
# "\tDomain box size (x, y): %e, %e\n"
.L_2__STRING.13:
|
||||
.long 1836008457
|
||||
.long 544106849
|
||||
.long 544763746
|
||||
.long 1702521203
|
||||
.long 746072096
|
||||
.long 975796512
|
||||
.long 744826144
|
||||
.long 174400800
|
||||
.byte 0
|
||||
.type .L_2__STRING.13,@object
|
||||
.size .L_2__STRING.13,33
|
||||
.space 3, 0x00 # pad
|
||||
.align 4
|
||||
# "\tCells (x, y): %d, %d\n"
.L_2__STRING.14:
|
||||
.long 1818575625
|
||||
.long 673215340
|
||||
.long 2032151672
|
||||
.long 622869033
|
||||
.long 622865508
|
||||
.word 2660
|
||||
.byte 0
|
||||
.type .L_2__STRING.14,@object
|
||||
.size .L_2__STRING.14,23
|
||||
.space 1, 0x00 # pad
|
||||
.align 4
|
||||
# "\tMax iterations: %d\n"
.L_2__STRING.16:
|
||||
.long 2019642633
|
||||
.long 1702127904
|
||||
.long 1769234802
|
||||
.long 980643439
|
||||
.long 174335264
|
||||
.byte 0
|
||||
.type .L_2__STRING.16,@object
|
||||
.size .L_2__STRING.16,21
|
||||
.space 3, 0x00 # pad
|
||||
.align 4
|
||||
# "\tepsilon (stopping tolerance) : %e\n"
.L_2__STRING.17:
|
||||
.long 1936745737
|
||||
.long 1852796009
|
||||
.long 1953703968
|
||||
.long 1768976495
|
||||
.long 1948280686
|
||||
.long 1919249519
|
||||
.long 1701015137
|
||||
.long 540680233
|
||||
.long 681253
|
||||
.type .L_2__STRING.17,@object
|
||||
.size .L_2__STRING.17,36
|
||||
.align 4
|
||||
# "\tomega (SOR relaxation): %e\n"
.L_2__STRING.18:
|
||||
.long 1701670665
|
||||
.long 673210727
|
||||
.long 542265171
|
||||
.long 1634493810
|
||||
.long 1769234808
|
||||
.long 975793775
|
||||
.long 174400800
|
||||
.byte 0
|
||||
.type .L_2__STRING.18,@object
|
||||
.size .L_2__STRING.18,29
|
||||
.data
|
||||
.section .note.GNU-stack, ""
|
||||
# End
|
4206
PoissonSolver/2D-mpi/ICC/solver.s
Normal file
4206
PoissonSolver/2D-mpi/ICC/solver.s
Normal file
File diff suppressed because it is too large
Load Diff
151
PoissonSolver/2D-mpi/ICC/timing.s
Normal file
151
PoissonSolver/2D-mpi/ICC/timing.s
Normal file
@@ -0,0 +1,151 @@
|
||||
# mark_description "Intel(R) C Intel(R) 64 Compiler Classic for applications running on Intel(R) 64, Version 2021.10.0 Build 202";
|
||||
# mark_description "30609_000000";
|
||||
# mark_description "-I./src/includes -I./ICC -I/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-mpi-2021.1";
|
||||
# mark_description "0.0-ki6gcj4pr5rekayazvm4lsmvcyosce25/mpi/2021.10.0/include -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux";
|
||||
# mark_description "8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux";
|
||||
# mark_description "/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-ax";
|
||||
# mark_description "ze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/x64 -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almal";
|
||||
# mark_description "inux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/l";
|
||||
# mark_description "inux/lib/oclfpga/host/linux64/lib -Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel";
|
||||
# mark_description "-oneapi-compilers-2023.2.1-axze7ocbc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/lib/oclfpga/linux64/lib ";
|
||||
# mark_description "-Wl,-rpath,/apps/SPACK/0.19.1/opt/linux-almalinux8-icelake/gcc-8.5.0/intel-oneapi-compilers-2023.2.1-axze7oc";
|
||||
# mark_description "bc5zpklxb6kr5h2d5hbpf2lxk/compiler/2023.2.1/linux/compiler/lib/intel64_lin -gcc-name=/usr/bin/gcc -gxx-name=";
|
||||
# mark_description "/usr/bin/g++ -S -fverbose-asm -D_GNU_SOURCE -DARRAY_ALIGNMENT=64 -O3 -xHost -qopt-zmm-usage=high -std=c99 -o";
|
||||
# mark_description " ICC/timing.s";
|
||||
.file "timing.c"
|
||||
.text
|
||||
..TXTST0:
|
||||
.L_2__routine_start_getTimeStamp_0:
|
||||
# -- Begin getTimeStamp
|
||||
.text
|
||||
# mark_begin;
|
||||
.align 16,0x90
|
||||
.globl getTimeStamp
|
||||
# --- getTimeStamp()
|
||||
# ---------------------------------------------------------------------
# getTimeStamp()  -- compiler-generated, AT&T syntax, SysV AMD64
# Calls clock_gettime with clock id 1 and converts the result to a double.
# In:    none
# Out:   %xmm0 = (double)qword[buf+0] + (double)qword[buf+8] * 1e-9
#        (presumably tv_sec and tv_nsec of struct timespec, i.e. seconds)
# Stack: 24 bytes reserved; the code reads the first 16 as the result buffer.
#        With the return address this keeps %rsp 16-byte aligned at the call.
# NOTE(review): clock id 1 is presumably CLOCK_MONOTONIC -- confirm in the C
#        source. The return value of clock_gettime is not checked.
# ---------------------------------------------------------------------
getTimeStamp:
|
||||
..B1.1: # Preds ..B1.0
|
||||
# Execution count [1.00e+00]
|
||||
.cfi_startproc
|
||||
..___tag_value_getTimeStamp.1:
|
||||
..L2:
|
||||
#11.1
|
||||
subq $24, %rsp #11.1
|
||||
.cfi_def_cfa_offset 32
|
||||
# arg1 = clock id 1, arg2 = address of the on-stack result buffer
movl $1, %edi #13.5
|
||||
lea (%rsp), %rsi #13.5
|
||||
# clock_gettime(clockid_t, struct timespec *)
|
||||
call clock_gettime #13.5
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B1.2: # Preds ..B1.1
|
||||
# Execution count [1.00e+00]
|
||||
# Zero the destinations first so the scalar converts carry no false
# dependency on the old register contents.
vxorpd %xmm0, %xmm0, %xmm0 #14.40
|
||||
vxorpd %xmm1, %xmm1, %xmm1 #14.20
|
||||
# xmm0 = (double) second 64-bit field, xmm1 = (double) first 64-bit field
vcvtsi2sdq 8(%rsp), %xmm0, %xmm0 #14.40
|
||||
vcvtsi2sdq (%rsp), %xmm1, %xmm1 #14.20
|
||||
# xmm0 = xmm0 * 1e-9 + xmm1 (the constant is .L_2il0floatpacket.0)
vfmadd132sd .L_2il0floatpacket.0(%rip), %xmm1, %xmm0 #14.53
|
||||
addq $24, %rsp #14.53
|
||||
.cfi_def_cfa_offset 8
|
||||
ret #14.53
|
||||
.align 16,0x90
|
||||
# LOE
|
||||
.cfi_endproc
|
||||
# mark_end;
|
||||
.type getTimeStamp,@function
|
||||
.size getTimeStamp,.-getTimeStamp
|
||||
..LNgetTimeStamp.0:
|
||||
.data
|
||||
# -- End getTimeStamp
|
||||
.text
|
||||
.L_2__routine_start_getTimeResolution_1:
|
||||
# -- Begin getTimeResolution
|
||||
.text
|
||||
# mark_begin;
|
||||
.align 16,0x90
|
||||
.globl getTimeResolution
|
||||
# --- getTimeResolution()
|
||||
# ---------------------------------------------------------------------
# getTimeResolution()  -- compiler-generated, AT&T syntax, SysV AMD64
# Calls clock_getres with clock id 1 and converts the result to a double.
# In:    none
# Out:   %xmm0 = (double)qword[buf+0] + (double)qword[buf+8] * 1e-9
#        (presumably tv_sec and tv_nsec of struct timespec, i.e. seconds)
# Stack: 24 bytes reserved; the code reads the first 16 as the result buffer.
#        With the return address this keeps %rsp 16-byte aligned at the call.
# NOTE(review): clock id 1 is presumably CLOCK_MONOTONIC -- confirm in the C
#        source. The return value of clock_getres is not checked.
# ---------------------------------------------------------------------
getTimeResolution:
|
||||
..B2.1: # Preds ..B2.0
|
||||
# Execution count [1.00e+00]
|
||||
.cfi_startproc
|
||||
..___tag_value_getTimeResolution.6:
|
||||
..L7:
|
||||
#18.1
|
||||
subq $24, %rsp #18.1
|
||||
.cfi_def_cfa_offset 32
|
||||
# arg1 = clock id 1, arg2 = address of the on-stack result buffer
movl $1, %edi #20.5
|
||||
lea (%rsp), %rsi #20.5
|
||||
..___tag_value_getTimeResolution.9:
|
||||
# clock_getres(clockid_t, struct timespec *)
|
||||
call clock_getres #20.5
|
||||
..___tag_value_getTimeResolution.10:
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B2.2: # Preds ..B2.1
|
||||
# Execution count [1.00e+00]
|
||||
# Zero the destinations first so the scalar converts carry no false
# dependency on the old register contents.
vxorpd %xmm0, %xmm0, %xmm0 #21.40
|
||||
vxorpd %xmm1, %xmm1, %xmm1 #21.20
|
||||
# xmm0 = (double) second 64-bit field, xmm1 = (double) first 64-bit field
vcvtsi2sdq 8(%rsp), %xmm0, %xmm0 #21.40
|
||||
vcvtsi2sdq (%rsp), %xmm1, %xmm1 #21.20
|
||||
# xmm0 = xmm0 * 1e-9 + xmm1 (the constant is .L_2il0floatpacket.0)
vfmadd132sd .L_2il0floatpacket.0(%rip), %xmm1, %xmm0 #21.53
|
||||
addq $24, %rsp #21.53
|
||||
.cfi_def_cfa_offset 8
|
||||
ret #21.53
|
||||
.align 16,0x90
|
||||
# LOE
|
||||
.cfi_endproc
|
||||
# mark_end;
|
||||
.type getTimeResolution,@function
|
||||
.size getTimeResolution,.-getTimeResolution
|
||||
..LNgetTimeResolution.1:
|
||||
.data
|
||||
# -- End getTimeResolution
|
||||
.text
|
||||
.L_2__routine_start_getTimeStamp__2:
|
||||
# -- Begin getTimeStamp_
|
||||
.text
|
||||
# mark_begin;
|
||||
.align 16,0x90
|
||||
.globl getTimeStamp_
|
||||
# --- getTimeStamp_()
|
||||
# ---------------------------------------------------------------------
# getTimeStamp_()  -- compiler-generated, AT&T syntax, SysV AMD64
# Same instruction sequence as getTimeStamp: every instruction is attributed
# to source line 26, which suggests the compiler inlined getTimeStamp here
# (NOTE(review): confirm in timing.c).
# In:    none
# Out:   %xmm0 = (double)qword[buf+0] + (double)qword[buf+8] * 1e-9
# Stack: 24 bytes reserved; the code reads the first 16 as the result buffer.
# ---------------------------------------------------------------------
getTimeStamp_:
|
||||
..B3.1: # Preds ..B3.0
|
||||
# Execution count [1.00e+00]
|
||||
.cfi_startproc
|
||||
..___tag_value_getTimeStamp_.13:
|
||||
..L14:
|
||||
#25.1
|
||||
subq $24, %rsp #25.1
|
||||
.cfi_def_cfa_offset 32
|
||||
# arg1 = clock id 1, arg2 = address of the on-stack result buffer
movl $1, %edi #26.12
|
||||
lea (%rsp), %rsi #26.12
|
||||
# clock_gettime(clockid_t, struct timespec *)
|
||||
call clock_gettime #26.12
|
||||
# LOE rbx rbp r12 r13 r14 r15
|
||||
..B3.2: # Preds ..B3.1
|
||||
# Execution count [1.00e+00]
|
||||
# Zero the destinations first so the scalar converts carry no false
# dependency on the old register contents.
vxorpd %xmm0, %xmm0, %xmm0 #26.12
|
||||
vxorpd %xmm1, %xmm1, %xmm1 #26.12
|
||||
# xmm0 = (double) second 64-bit field, xmm1 = (double) first 64-bit field
vcvtsi2sdq 8(%rsp), %xmm0, %xmm0 #26.12
|
||||
vcvtsi2sdq (%rsp), %xmm1, %xmm1 #26.12
|
||||
# xmm0 = xmm0 * 1e-9 + xmm1 (the constant is .L_2il0floatpacket.0)
vfmadd132sd .L_2il0floatpacket.0(%rip), %xmm1, %xmm0 #26.12
|
||||
addq $24, %rsp #26.12
|
||||
.cfi_def_cfa_offset 8
|
||||
ret #26.12
|
||||
.align 16,0x90
|
||||
# LOE
|
||||
.cfi_endproc
|
||||
# mark_end;
|
||||
.type getTimeStamp_,@function
|
||||
.size getTimeStamp_,.-getTimeStamp_
|
||||
..LNgetTimeStamp_.2:
|
||||
.data
|
||||
# -- End getTimeStamp_
|
||||
# Scale factor used by the three timing routines in their fused multiply-add.
.section .rodata, "a"
|
||||
.align 8
|
||||
.align 8
|
||||
# 0x3e112e0be826d695 = 1e-9 as an IEEE-754 double (low 32-bit word first)
.L_2il0floatpacket.0:
|
||||
.long 0xe826d695,0x3e112e0b
|
||||
.type .L_2il0floatpacket.0,@object
|
||||
.size .L_2il0floatpacket.0,8
|
||||
.data
|
||||
.section .note.GNU-stack, ""
|
||||
# End
|
@@ -33,7 +33,7 @@ $(BUILD_DIR)/%.o: %.c $(MAKE_DIR)/include_$(TAG).mk
|
||||
|
||||
$(BUILD_DIR)/%.s: %.c
|
||||
$(info ===> GENERATE ASM $@)
|
||||
$(CC) -S $(CPPFLAGS) $(CFLAGS) $< -o $@
|
||||
$(CC) -S -fverbose-asm $(CPPFLAGS) $(CFLAGS) $< -o $@
|
||||
|
||||
.PHONY: clean distclean tags info asm
|
||||
|
||||
|
Reference in New Issue
Block a user