123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251 |
- # mark_description "Intel(R) C Intel(R) 64 Compiler Classic for applications running on Intel(R) 64, Version 2021.3.0 Build 2021";
- # mark_description "0609_000000";
- # mark_description "-m64 -c -Wall -S -fverbose-asm -qopt-report-embed";
- .file "d4dag.c"
- .text
- ..TXTST0:
- .L_2__routine_start_d4d_version_0:
- # -- Begin d4d_version
- .text
- # mark_begin;
- .align 16,0x90 # start the routine on a 16-byte boundary, padding with 0x90 (NOP) bytes
- .globl d4d_version
- # --- d4d_version(void) -- leaf routine: returns the constant 10 in %eax. Takes no arguments, touches no memory and no stack, modifies only %eax.
- d4d_version:
- ..B1.1: # Preds ..B1.0
- # Execution count [1.00e+00]
- .cfi_startproc
- ..___tag_value_d4d_version.1:
- ..L2:
- #86.1 (the trailing #N.M tags are presumably line.column positions in d4dag.c -- confirm against the C source)
- movl $10, %eax #87.9 return value = 10 (the 32-bit write also clears the upper half of %rax)
- ret #87.9
- .align 16,0x90 # pad the tail of the routine to a 16-byte boundary
- # LOE
- .cfi_endproc
- # mark_end;
- .type d4d_version,@function
- .size d4d_version,.-d4d_version # size = distance from the d4d_version label to this point
- ..LNd4d_version.0:
- .data
- # -- End d4d_version
- .text
- .L_2__routine_start_d4d_deinit_1:
- # -- Begin d4d_deinit
- .text
- # mark_begin;
- .align 16,0x90 # start the routine on a 16-byte boundary, padding with 0x90 (NOP) bytes
- .globl d4d_deinit
- # --- d4d_deinit(void) -- if the global pointer d4d__main is non-NULL, calls the function pointer stored at offset 8 of that object with the object itself as argument, then sets d4d__main to NULL. Returns 0 in %eax on both paths. Offset 8 is the slot d4d_init fills with its second parameter.
- d4d_deinit:
- ..B2.1: # Preds ..B2.0
- # Execution count [1.00e+00]
- .cfi_startproc
- ..___tag_value_d4d_deinit.4:
- ..L5:
- #124.1
- pushq %rsi #124.1 scratch push: the saved value is never read back (the slot is popped into %rcx on exit). It moves %rsp by 8 so the stack is 16-byte aligned at the indirect call below (SysV AMD64)
- .cfi_def_cfa_offset 16
- movq d4d__main(%rip), %rdi #126.7 rdi = d4d__main, loaded straight into the first-argument register
- testq %rdi, %rdi #126.7
- jne ..B2.3 # Prob 67% #126.7 non-NULL: go release the object
- # LOE rbx rbp rdi r12 r13 r14 r15
- ..B2.2: # Preds ..B2.1 -- d4d__main was NULL: nothing to release
- # Execution count [3.26e-01]
- xorl %eax, %eax #127.10 return 0
- popq %rcx #127.10 discard the scratch slot pushed on entry
- .cfi_def_cfa_offset 8
- ret #127.10
- .cfi_def_cfa_offset 16 # unwind state for the code below, which is reached by the jne with the entry push still on the stack
- # LOE
- ..B2.3: # Preds ..B2.1 -- d4d__main is non-NULL and still in %rdi
- # Execution count [6.74e-01]
- ..___tag_value_d4d_deinit.9:
- call *8(%rdi) #131.2 indirect call through the pointer at offset 8 of the object, argument = the object pointer
- ..___tag_value_d4d_deinit.10:
- # LOE rbx rbp r12 r13 r14 r15
- ..B2.4: # Preds ..B2.3
- # Execution count [6.74e-01]
- movq $0, d4d__main(%rip) #132.2 d4d__main = NULL, so a later d4d_deinit takes the ..B2.2 path
- xorl %eax, %eax #133.9 return 0
- popq %rcx #133.9 discard the scratch slot pushed on entry
- .cfi_def_cfa_offset 8
- ret #133.9
- .align 16,0x90 # pad the tail of the routine to a 16-byte boundary
- # LOE
- .cfi_endproc
- # mark_end;
- .type d4d_deinit,@function
- .size d4d_deinit,.-d4d_deinit # size = distance from the d4d_deinit label to this point
- ..LNd4d_deinit.1:
- .data
- # -- End d4d_deinit
- .text
- .L_2__routine_start_d4d_init_2:
- # -- Begin d4d_init
- .text
- # mark_begin;
- .align 16,0x90 # start the routine on a 16-byte boundary, padding with 0x90 (NOP) bytes
- .globl d4d_init
- # --- d4d_init(void *(*)(unsigned int), void (*)(void *)) -- validates both function pointers, calls parameter 1 with the value 16, stores the result in d4d__main, and records parameter 1 at offset 0 and parameter 2 at offset 8 of the returned object. Returns in %eax: 0 on success, -1 if either parameter is NULL, -2 if the call through parameter 1 returns NULL. NOTE(review): d4d__main is overwritten without its previous value being read or released, so a second call while an object is live drops the old pointer.
- d4d_init:
- # parameter 1: %rdi
- # parameter 2: %rsi
- ..B3.1: # Preds ..B3.0
- # Execution count [1.00e+00]
- .cfi_startproc
- ..___tag_value_d4d_init.13:
- ..L14:
- #101.1
- pushq %r14 #101.1 save callee-saved r14, used below to keep parameter 1 across the call
- .cfi_def_cfa_offset 16
- .cfi_offset 14, -16
- pushq %r15 #101.1 save callee-saved r15, used below to keep parameter 2 across the call
- .cfi_def_cfa_offset 24
- .cfi_offset 15, -24
- pushq %rsi #101.1 scratch push: the value is never read back (the slot is popped into %rcx). Third push, so %rsp is 16-byte aligned at the indirect call in ..B3.3
- .cfi_def_cfa_offset 32
- movq %rdi, %r14 #101.1 r14 = parameter 1
- movq %rsi, %r15 #101.1 r15 = parameter 2
- testq %r14, %r14 #103.6
- je ..B3.8 # Prob 5% #103.6 parameter 1 is NULL: return -1
- # LOE rbx rbp r12 r13 r14 r15
- ..B3.2: # Preds ..B3.1
- # Execution count [9.50e-01]
- testq %r15, %r15 #106.7
- je ..B3.8 # Prob 15% #106.7 parameter 2 is NULL: return -1
- # LOE rbx rbp r12 r13 r14 r15
- ..B3.3: # Preds ..B3.2 -- both parameters are non-NULL here
- # Execution count [7.99e-01]
- movl $16, %edi #109.35 argument = 16, the same byte count that ..B3.6 initialises (two 8-byte slots)
- ..___tag_value_d4d_init.20:
- call *%r14 #109.35 indirect call through parameter 1, result in %rax
- ..___tag_value_d4d_init.21:
- # LOE rax rbx rbp r12 r13 r14 r15
- ..B3.4: # Preds ..B3.3
- # Execution count [7.99e-01]
- movq %rax, d4d__main(%rip) #109.2 published before the NULL check, so on failure d4d__main ends up NULL
- testq %rax, %rax #110.7
- jne ..B3.6 # Prob 67% #110.7 non-NULL result: go initialise the object
- # LOE rax rbx rbp r12 r13 r14 r15
- ..B3.5: # Preds ..B3.4 -- the call through parameter 1 returned NULL
- # Execution count [2.61e-01]
- movl $-2, %eax #111.10 return -2
- popq %rcx #111.10 discard the scratch slot
- .cfi_def_cfa_offset 24
- .cfi_restore 15
- popq %r15 #111.10
- .cfi_def_cfa_offset 16
- .cfi_restore 14
- popq %r14 #111.10
- .cfi_def_cfa_offset 8
- ret #111.10
- .cfi_def_cfa_offset 32 # unwind state for the code below, which is reached by a jump with all three pushes still on the stack
- .cfi_offset 14, -16
- .cfi_offset 15, -24
- # LOE rbx rbp r12 r13 eax
- ..B3.6: # Preds ..B3.4 -- rax = the newly obtained 16-byte object
- # Execution count [5.39e-01]
- ..L30: # this label is referenced by the .quad in the .debug_opt_report section
- # optimization report
- # LOOP WAS COMPLETELY UNROLLED
- # LOOP WAS VECTORIZED
- # VECTORIZATION HAS UNALIGNED MEMORY REFERENCES
- # VECTORIZATION SPEEDUP COEFFECIENT 2.667969
- # LOOP HAS ONE VECTOR ITERATION
- # VECTOR LENGTH 16
- # NORMALIZED VECTORIZATION OVERHEAD 0.812500
- # MAIN VECTOR TYPE: 8-bits integer
- # THE LOOP HAS FP INDUCTION
- pxor %xmm0, %xmm0 #144.4 xmm0 = 0. Position 144 lies outside this routine's other tags (101-117), so this is presumably an inlined zeroing loop -- confirm against d4dag.c
- movdqu %xmm0, (%rax) #144.4 zero all 16 bytes of the object with one unaligned store
- movq %r14, (%rax) #115.2 offset 0 = parameter 1
- movq %r15, 8(%rax) #116.2 offset 8 = parameter 2 (the slot d4d_deinit calls through). NOTE(review): these two stores overwrite every byte zeroed above
- xorl %eax, %eax #117.9 return 0
- # LOE rbx rbp r12 r13 eax
- ..B3.7: # Preds ..B3.6 -- epilogue of the success path
- # Execution count [7.99e-01]
- popq %rcx #111.10 discard the scratch slot
- .cfi_def_cfa_offset 24
- .cfi_restore 15
- popq %r15 #111.10
- .cfi_def_cfa_offset 16
- .cfi_restore 14
- popq %r14 #111.10
- .cfi_def_cfa_offset 8
- ret #111.10
- .cfi_def_cfa_offset 32 # unwind state for the code below, which is reached by a jump with all three pushes still on the stack
- .cfi_offset 14, -16
- .cfi_offset 15, -24
- # LOE
- ..B3.8: # Preds ..B3.2 ..B3.1 -- one of the two parameters was NULL. Nothing has been called and d4d__main is untouched
- # Execution count [5.04e-02]: Infreq
- movl $-1, %eax #104.9 return -1
- popq %rcx #104.9 discard the scratch slot
- .cfi_def_cfa_offset 24
- .cfi_restore 15
- popq %r15 #104.9
- .cfi_def_cfa_offset 16
- .cfi_restore 14
- popq %r14 #104.9
- .cfi_def_cfa_offset 8
- ret #104.9
- .align 16,0x90 # pad the tail of the routine to a 16-byte boundary
- # LOE
- .cfi_endproc
- # mark_end;
- .type d4d_init,@function
- .size d4d_init,.-d4d_init # size = distance from the d4d_init label to this point
- ..LNd4d_init.2:
- .data
- # -- End d4d_init
- .bss
- .align 8
- .align 8 # repeated directive, no additional effect
- d4d__main: # 8-byte zero-initialised object with no .globl directive in this file. d4d_init stores the object pointer here, d4d_deinit reads it and resets it to 0
- .type d4d__main,@object
- .size d4d__main,8
- .space 8 # pad -- these 8 bytes are the storage of d4d__main itself (the declared size is 8), not padding after it
- .data
- .section .debug_opt_report, "" # section with empty flags holding the embedded optimization report (the file was built with -qopt-report-embed). The field meanings below are inferred from the values only -- confirm against Intel documentation before relying on them
- ..L45: # start of the table. The two offsets below are relative to this label
- .ascii ".itt_notify_tab\0" # 16-byte NUL-terminated tag string
- .word 258 # 258 = 0x0102, presumably a format version -- unconfirmed
- .word 48 # equals the number of bytes from ..L45 to the end of the 0x00000008,0x00000000 pair below, so presumably the header size -- unconfirmed
- .long 2
- .long ..L46 - ..L45 # offset of the string table ..L46
- .long 48 # matches the size of the ..L46 table (12 longs = 48 bytes)
- .long ..L47 - ..L45 # offset of the data block ..L47
- .long 25 # matches the size of the ..L47 block (6 longs + 1 byte = 25 bytes)
- .long 0x00000008,0x00000000
- .long 0
- .long 0
- .long 0
- .long 1
- .quad ..L30 # address of label ..L30, the block in d4d_init that carries the optimization report comments
- .long 28 # equals the length of "optimization_report_version" including its NUL -- possibly an offset or length into ..L46, unconfirmed
- .long 5
- ..L46: # string table: two NUL-terminated ASCII strings stored as little-endian longs
- .long 1769238639 # "opti"
- .long 1635412333 # "miza"
- .long 1852795252 # "tion"
- .long 1885696607 # "_rep"
- .long 1601466991 # "ort_"
- .long 1936876918 # "vers"
- .long 7237481 # "ion" + NUL, which ends "optimization_report_version"
- .long 1769238639 # "opti"
- .long 1635412333 # "miza"
- .long 1852795252 # "tion"
- .long 1885696607 # "_rep"
- .long 7631471 # "ort" + NUL, which ends "optimization_report"
- ..L47: # 25 bytes of encoded report payload. The encoding is not evident from this file, presumably the binary form of the report text printed at ..L30
- .long -2045771008
- .long -2146430206
- .long -1065320320
- .long -2139062144
- .long -1783594366
- .long -2137151032
- .byte 16
- .section .note.GNU-stack, "" # empty marker section. By GNU toolchain convention it tells the linker this object does not need an executable stack
- # End
|