Skip to content

Commit

Permalink
Added the missing L() wrappers around local labels (e.g. `.Lp` -> `L(p)`) in all asm files used by Skylake
Browse files (browse the repository at this point in the history)
  • Loading branch information
dimpase committed Nov 23, 2017
1 parent 30dfa68 commit 6070d68
Show file tree
Hide file tree
Showing 23 changed files with 404 additions and 286 deletions.
118 changes: 118 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -284,6 +284,124 @@ tests/t-modlinv
tests/t-parity
tests/t-popc
tests/t-sub
tests/misc/t-locale
tests/misc/t-printf
tests/misc/t-scanf
tests/mpf/reuse
tests/mpf/t-add
tests/mpf/t-cmp_d
tests/mpf/t-cmp_si
tests/mpf/t-conv
tests/mpf/t-div
tests/mpf/t-dm2exp
tests/mpf/t-eq
tests/mpf/t-fits
tests/mpf/t-get_d
tests/mpf/t-get_d_2exp
tests/mpf/t-get_si
tests/mpf/t-get_ui
tests/mpf/t-gsprec
tests/mpf/t-inp_str
tests/mpf/t-int_p
tests/mpf/t-mul_ui
tests/mpf/t-muldiv
tests/mpf/t-set
tests/mpf/t-set_q
tests/mpf/t-set_si
tests/mpf/t-set_ui
tests/mpf/t-sqrt
tests/mpf/t-sqrt_ui
tests/mpf/t-sub
tests/mpf/t-trunc
tests/mpf/t-ui_div
tests/mpq/t-aors
tests/mpq/t-cmp
tests/mpq/t-cmp_si
tests/mpq/t-cmp_ui
tests/mpq/t-cmp_z
tests/mpq/t-equal
tests/mpq/t-get_d
tests/mpq/t-get_str
tests/mpq/t-inp_str
tests/mpq/t-md_2exp
tests/mpq/t-set_f
tests/mpq/t-set_str
tests/mpz/bit
tests/mpz/convert
tests/mpz/dive
tests/mpz/dive_ui
tests/mpz/io
tests/mpz/logic
tests/mpz/reuse
tests/mpz/st_hamdist
tests/mpz/st_popcount
tests/mpz/t-addsub
tests/mpz/t-aorsmul
tests/mpz/t-bin
tests/mpz/t-cdiv_ui
tests/mpz/t-cmp
tests/mpz/t-cmp_d
tests/mpz/t-cmp_si
tests/mpz/t-cong
tests/mpz/t-cong_2exp
tests/mpz/t-div_2exp
tests/mpz/t-divis
tests/mpz/t-divis_2exp
tests/mpz/t-export
tests/mpz/t-fac_ui
tests/mpz/t-fdiv
tests/mpz/t-fdiv_ui
tests/mpz/t-fib_ui
tests/mpz/t-fits
tests/mpz/t-gcd
tests/mpz/t-gcd_ui
tests/mpz/t-get_d
tests/mpz/t-get_d_2exp
tests/mpz/t-get_si
tests/mpz/t-get_sx
tests/mpz/t-get_ux
tests/mpz/t-hamdist
tests/mpz/t-import
tests/mpz/t-inp_str
tests/mpz/t-io_raw
tests/mpz/t-jac
tests/mpz/t-lcm
tests/mpz/t-likely_prime_p
tests/mpz/t-limbs
tests/mpz/t-lucnum_ui
tests/mpz/t-mfac_uiui
tests/mpz/t-mul
tests/mpz/t-mul_i
tests/mpz/t-next_prime_candidate
tests/mpz/t-oddeven
tests/mpz/t-perfpow
tests/mpz/t-perfsqr
tests/mpz/t-popcount
tests/mpz/t-pow
tests/mpz/t-powm
tests/mpz/t-powm_ui
tests/mpz/t-pprime_p
tests/mpz/t-primorial_ui
tests/mpz/t-root
tests/mpz/t-scan
tests/mpz/t-set_d
tests/mpz/t-set_f
tests/mpz/t-set_si
tests/mpz/t-set_str
tests/mpz/t-set_sx
tests/mpz/t-set_ux
tests/mpz/t-sizeinbase
tests/mpz/t-sqrtrem
tests/mpz/t-tdiv
tests/mpz/t-tdiv_ui
tests/mpz/t-trial_division
tests/rand/t-iset
tests/rand/t-lc2exp
tests/rand/t-mt
tests/rand/t-rand
tests/rand/t-urbui
tests/rand/t-urmui
tests/rand/t-urndmm
aclocal.m4
compile
configure
Expand Down
40 changes: 20 additions & 20 deletions mpn/x86_64/haswell/karaadd.asm
Original file line number Diff line number Diff line change
Expand Up @@ -52,7 +52,7 @@ mov $3,%ecx
sub %rdx,%rcx
mov $3,%edx
.align 16
.Lp: bt $2,%rbx
L(p): bt $2,%rbx
mov (%rdi,%rdx,8),%r8
adc (%rbp,%rcx,8),%r8
mov %r8,%r12
Expand Down Expand Up @@ -100,12 +100,12 @@ mov $3,%edx
mov %r14,16(%rbp,%rcx,8)
mov %r15,24(%rbp,%rcx,8)
add $4,%rcx
jnc .Lp
jnc L(p)
cmp $2,%rcx
jg .Lcase0
jz .Lcase1
jp .Lcase2
.Lcase3: #rcx=0
jg L(case0)
jz L(case1)
jp L(case2)
L(case3): #rcx=0
bt $2,%rbx
mov (%rdi,%rdx,8),%r8
adc (%rbp),%r8
Expand Down Expand Up @@ -144,8 +144,8 @@ jp .Lcase2
mov %r12,(%rbp)
mov %r13,8(%rbp)
mov %r14,16(%rbp)
jmp .Lfin
.Lcase2: #rcx=1
jmp L(fin)
L(case2): #rcx=1
bt $2,%rbx
mov (%rdi,%rdx,8),%r8
adc 8(%rbp),%r8
Expand Down Expand Up @@ -175,8 +175,8 @@ jp .Lcase2
add $2,%rdx
mov %r12,8(%rbp)
mov %r13,16(%rbp)
jmp .Lfin
.Lcase1: #rcx=2
jmp L(fin)
L(case1): #rcx=2
bt $2,%rbx
mov (%rdi,%rdx,8),%r8
adc 16(%rbp),%r8
Expand All @@ -197,11 +197,11 @@ jp .Lcase2
adc %rbx,%rbx
inc %rdx
mov %r12,(%rbp,%rcx,8)
.Lfin: mov $3,%rcx
.Lcase0: #rcx=3
L(fin): mov $3,%rcx
L(case0): #rcx=3
pop %r8
bt $0,%r8
jnc .Lnotodd
jnc L(notodd)
xor %r10,%r10
mov (%rbp,%rdx,8),%r8
mov 8(%rbp,%rdx,8),%r9
Expand All @@ -211,24 +211,24 @@ jp .Lcase2
add %r8,24(%rbp)
adc %r9,32(%rbp)
adc %r10,40(%rbp)
.L7: adcq $0,24(%rbp,%rcx,8)
L(l7): adcq $0,24(%rbp,%rcx,8)
inc %rcx
jc .L7
jc L(l7)
mov $3,%rcx
.Lnotodd:and $3,%rax
L(notodd):and $3,%rax
popcnt %rax,%r8
bt $2,%rbx
adc $0,%r8
adc %r8,(%rdi,%rdx,8)
.L1: adcq $0,8(%rdi,%rdx,8)
L(l1): adcq $0,8(%rdi,%rdx,8)
inc %rdx
jc .L1
jc L(l1)
and $7,%rbx
popcnt %rbx,%r8
add %r8,24(%rbp)
.L2: adcq $0,8(%rbp,%rcx,8)
L(l2): adcq $0,8(%rbp,%rcx,8)
inc %rcx
jc .L2
jc L(l2)
pop %r15
pop %r14
pop %r13
Expand Down
Loading

0 comments on commit 6070d68

Please sign in to comment.