projects
/
musl
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
make type of st_dev explicitly dev_t in x86_64 stat.h
[musl]
/
src
/
math
/
i386
/
exp.s
diff --git
a/src/math/i386/exp.s
b/src/math/i386/exp.s
index
ca0de1d
..
abb9036
100644
(file)
--- a/
src/math/i386/exp.s
+++ b/
src/math/i386/exp.s
@@
-2,7
+2,18
@@
.type expm1f,@function
expm1f:
flds 4(%esp)
.type expm1f,@function
expm1f:
flds 4(%esp)
- jmp 1f
+ mov 4(%esp),%eax
+ add %eax,%eax
+ cmp $0x01000000,%eax
+ jae 1f
+ # subnormal x, return x with underflow
+ fnstsw %ax
+ and $16,%ax
+ jnz 2f
+ fld %st(0)
+ fmul %st(1)
+ fstps 4(%esp)
+2: ret
.global expm1l
.type expm1l,@function
.global expm1l
.type expm1l,@function
@@
-14,10
+25,32
@@
expm1l:
.type expm1,@function
expm1:
fldl 4(%esp)
.type expm1,@function
expm1:
fldl 4(%esp)
+ mov 8(%esp),%eax
+ add %eax,%eax
+ cmp $0x00200000,%eax
+ jae 1f
+ # subnormal x, return x with underflow
+ fnstsw %ax
+ and $16,%ax
+ jnz 2f
+ fsts 4(%esp)
+2: ret
1: fldl2e
fmulp
1: fldl2e
fmulp
+ mov $0xc2820000,%eax
+ push %eax
+ flds (%esp)
+ pop %eax
+ fucomp %st(1)
+ fnstsw %ax
+ sahf
fld1
fld1
- fld %st(1)
+ jb 1f
+ # x*log2e < -65, return -1 without underflow
+ fstp %st(1)
+ fchs
+ ret
+1: fld %st(1)
fabs
fucom %st(1)
fnstsw %ax
fabs
fucom %st(1)
fnstsw %ax
@@
-50,12
+83,6
@@
expf:
flds 4(%esp)
jmp 2f
flds 4(%esp)
jmp 2f
-.global expl
-.type expl,@function
-expl:
- fldt 4(%esp)
- jmp 2f
-
.global exp
.type exp,@function
exp:
.global exp
.type exp,@function
exp:
@@
-68,52
+95,55
@@
exp:
.type exp2,@function
exp2:
fldl 4(%esp)
.type exp2,@function
exp2:
fldl 4(%esp)
-1: pushl $0x467ff000
- flds (%esp)
- xorl %eax,%eax
- pushl $0x80000000
- push %eax
+1: sub $12,%esp
+ fld %st(0)
+ fstpt (%esp)
+ mov 8(%esp),%ax
+ and $0x7fff,%ax
+ cmp $0x3fff+13,%ax
+ jb 4f # |x| < 8192
+ cmp $0x3fff+15,%ax
+ jae 3f # |x| >= 32768
+ fsts (%esp)
+ cmpl $0xc67ff800,(%esp)
+ jb 2f # x > -16382
+ movl $0x5f000000,(%esp)
+ flds (%esp) # 0x1p63
fld %st(1)
fld %st(1)
- fabs
- fucom %st(1)
+ fsub %st(1)
+ faddp
+ fucomp %st(1)
fnstsw
fnstsw
- fstp %st(0)
- fstp %st(0)
sahf
sahf
- ja 2f
- fld %st(0)
- fistpl 8(%esp)
- fildl 8(%esp)
- fxch %st(1)
- fsub %st(1)
- mov $0x3fff,%eax
- add %eax,8(%esp)
+ je 2f # x - 0x1p63 + 0x1p63 == x
+ movl $1,(%esp)
+ flds (%esp) # 0x1p-149
+ fdiv %st(1)
+ fstps (%esp) # raise underflow
+2: fld1
+ fld %st(1)
+ frndint
+ fxch %st(2)
+ fsub %st(2) # st(0)=x-rint(x), st(1)=1, st(2)=rint(x)
f2xm1
f2xm1
- fld1
- faddp
- fldt (%esp)
- fmulp
+ faddp # 2^(x-rint(x))
+1: fscale
fstp %st(1)
add $12,%esp
ret
fstp %st(1)
add $12,%esp
ret
-
-2: fld %st(0)
+3: xor %eax,%eax
+4: cmp $0x3fff-64,%ax
+ fld1
+ jb 1b # |x| < 0x1p-64
fstpt (%esp)
fstpt (%esp)
- mov 9(%esp),%ah
- and $0x7f,%ah
- cmp $0x7f,%ah
- jne 1f
- decb 9(%esp)
- fstp %st(0)
- fldt (%esp)
-1: fld %st(0)
- frndint
- fxch %st(1)
- fsub %st(1)
+ fistl 8(%esp)
+ fildl 8(%esp)
+ fsubrp %st(1)
+ addl $0x3fff,8(%esp)
f2xm1
fld1
f2xm1
fld1
- faddp
- f
scale
- f
stp %st(1)
+ faddp
# 2^(x-rint(x))
+ f
ldt (%esp) # 2^rint(x)
+ f
mulp
add $12,%esp
ret
add $12,%esp
ret