Skip to content

Commit 7eb36f5

Browse files
committed
Add newlib sqrtf
1 parent 024580d commit 7eb36f5

File tree

3 files changed

+207
-0
lines changed

3 files changed

+207
-0
lines changed

src/fdlibm.rs

+89
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,89 @@
1+
/* @(#)fdlibm.h 5.1 93/09/24 */
2+
/*
3+
* ====================================================
4+
* Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
5+
*
6+
* Developed at SunPro, a Sun Microsystems, Inc. business.
7+
* Permission to use, copy, modify, and distribute this
8+
* software is freely granted, provided that this notice
9+
* is preserved.
10+
* ====================================================
11+
*/
12+
13+
#![allow(dead_code)] // not deadcode, just for debug and warnings
14+
15+
/* Most routines need to check whether a float is finite, infinite, or not a
16+
number, and many need to know whether the result of an operation will
17+
overflow. These conditions depend on whether the largest exponent is
18+
used for NaNs & infinities, or whether it's used for finite numbers. */
19+
20+
/// True if a positive float with bitmask X is finite.
21+
#[inline]
22+
#[allow(non_snake_case)]
23+
pub fn FLT_UWORD_IS_FINITE(x: u32) -> bool {
24+
x < 0x7f80_0000
25+
}
26+
27+
/// True if a positive float with bitmask X is not a number.
28+
#[inline]
29+
#[allow(non_snake_case)]
30+
pub fn FLT_UWORD_IS_NAN(x: u32) -> bool {
31+
x > 0x7f80_0000
32+
}
33+
34+
/// True if a positive float with bitmask X is +infinity.
35+
#[inline]
36+
#[allow(non_snake_case)]
37+
pub fn FLT_UWORD_IS_INFINITE(x: u32) -> bool {
38+
x == 0x7f80_0000
39+
}
40+
41+
/// The bitmask of FLT_MAX.
42+
pub const FLT_UWORD_MAX: u32 = 0x7f7f_ffff;
43+
/// The bitmask of FLT_MAX/2.
44+
pub const FLT_UWORD_HALF_MAX: u32 = FLT_UWORD_MAX - (1 << 23);
45+
/// The bitmask of the largest finite exponent (129 if the largest
46+
/// exponent is used for finite numbers, 128 otherwise).
47+
pub const FLT_UWORD_EXP_MAX: u32 = 0x4300_0000;
48+
/// The bitmask of log(FLT_MAX), rounded down. This value is the largest
49+
/// input that can be passed to exp() without producing overflow.
50+
pub const FLT_UWORD_LOG_MAX: u32 = 0x42b1_7217;
51+
/// The bitmask of log(2*FLT_MAX), rounded down. This value is the
52+
/// largest input than can be passed to cosh() without producing
53+
/// overflow.
54+
pub const FLT_UWORD_LOG_2MAX: u32 = 0x42b2_d4fc;
55+
/// The largest biased exponent that can be used for finite numbers
56+
/// (255 if the largest exponent is used for finite numbers, 254
57+
/// otherwise)
58+
pub const FLT_LARGEST_EXP: u32 = FLT_UWORD_MAX >> 23;
59+
pub const HUGE: f32 = 3.402_823_466_385_288_60e+38;
60+
61+
/* Many routines check for zero and subnormal numbers. Such things depend
62+
on whether the target supports denormals or not */
63+
64+
/// True if a positive float with bitmask X is +0. Without denormals,
65+
/// any float with a zero exponent is a +0 representation. With
66+
/// denormals, the only +0 representation is a 0 bitmask.
67+
#[inline]
68+
#[allow(non_snake_case)]
69+
pub fn FLT_UWORD_IS_ZERO(x: u32) -> bool {
70+
x == 0
71+
}
72+
73+
/// True if a non-zero positive float with bitmask X is subnormal.
74+
/// (Routines should check for zeros first.)
75+
#[inline]
76+
#[allow(non_snake_case)]
77+
pub fn FLT_UWORD_IS_SUBNORMAL(x: u32) -> bool {
78+
x < 0x0080_0000
79+
}
80+
81+
/// The bitmask of the smallest float above +0. Call this number REAL_FLT_MIN...
82+
pub const FLT_UWORD_MIN: usize = 0x0000_0001;
83+
/// The bitmask of the float representation of REAL_FLT_MIN's exponent.
84+
pub const FLT_UWORD_EXP_MIN: usize = 0x4316_0000;
85+
/// The bitmask of |log(REAL_FLT_MIN)|, rounding down.
86+
pub const FLT_UWORD_LOG_MIN: usize = 0x42cf_f1b5;
87+
/// REAL_FLT_MIN's exponent - EXP_BIAS (1 if denormals are not supported,
88+
/// -22 if they are).
89+
pub const FLT_SMALLEST_EXP: isize = -22;

src/math/mod.rs

+3
Original file line numberDiff line numberDiff line change
@@ -332,3 +332,6 @@ fn with_set_low_word(f: f64, lo: u32) -> f64 {
332332
fn combine_words(hi: u32, lo: u32) -> f64 {
333333
f64::from_bits((hi as u64) << 32 | lo as u64)
334334
}
335+
336+
#[path = "../fdlibm.rs"]
337+
mod fdlibm;

src/math/sqrtf.rs

+115
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,115 @@
1+
/* ef_sqrtf.c -- float version of e_sqrt.c.
2+
* Conversion to float by Ian Lance Taylor, Cygnus Support, [email protected].
3+
*/
4+
5+
/*
6+
* ====================================================
7+
* Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
8+
*
9+
* Developed at SunPro, a Sun Microsystems, Inc. business.
10+
* Permission to use, copy, modify, and distribute this
11+
* software is freely granted, provided that this notice
12+
* is preserved.
13+
* ====================================================
14+
*/
15+
16+
const ONE: f32 = 1.0;
17+
const TINY: f32 = 1.0e-30;
18+
19+
#[inline]
20+
#[cfg_attr(all(test, assert_no_panic), no_panic::no_panic)]
21+
pub fn sqrtf(x: f32) -> f32 {
22+
use super::fdlibm::{FLT_UWORD_IS_FINITE, FLT_UWORD_IS_SUBNORMAL, FLT_UWORD_IS_ZERO};
23+
// On wasm32 we know that LLVM's intrinsic will compile to an optimized
24+
// `f32.sqrt` native instruction, so we can leverage this for both code size
25+
// and speed.
26+
llvm_intrinsically_optimized! {
27+
#[cfg(target_arch = "wasm32")] {
28+
return if x < 0.0 {
29+
::core::f32::NAN
30+
} else {
31+
unsafe { ::core::intrinsics::sqrtf32(x) }
32+
}
33+
}
34+
}
35+
36+
let mut z: f32;
37+
38+
let mut r: u32;
39+
let hx: u32;
40+
41+
let mut ix: i32;
42+
let mut s: i32;
43+
let mut q: i32;
44+
let mut m: i32;
45+
let mut t: i32;
46+
let mut i: i32;
47+
48+
ix = x.to_bits() as i32;
49+
hx = ix as u32 & 0x7fff_ffff;
50+
51+
/* take care of Inf and NaN */
52+
if !FLT_UWORD_IS_FINITE(hx) {
53+
return x * x + x; /* sqrt(NaN)=NaN, sqrt(+inf)=+inf, sqrt(-inf)=sNaN */
54+
}
55+
56+
/* take care of zero and -ves */
57+
if FLT_UWORD_IS_ZERO(hx) {
58+
return x; /* sqrt(+-0) = +-0 */
59+
}
60+
if ix < 0 {
61+
return (x - x) / (x - x); /* sqrt(-ve) = sNaN */
62+
}
63+
64+
/* normalize x */
65+
m = ix >> 23;
66+
if FLT_UWORD_IS_SUBNORMAL(hx) {
67+
/* subnormal x */
68+
i = 0;
69+
while ix & 0x0080_0000 == 0 {
70+
ix <<= 1;
71+
i += 1;
72+
}
73+
m -= i - 1;
74+
}
75+
m -= 127; /* unbias exponent */
76+
ix = (ix & 0x007f_ffff) | 0x0080_0000;
77+
/* odd m, double x to make it even */
78+
if m & 1 == 1 {
79+
ix += ix;
80+
}
81+
m >>= 1; /* m = [m/2] */
82+
83+
/* generate sqrt(x) bit by bit */
84+
ix += ix;
85+
q = 0;
86+
s = 0; /* q = sqrt(x) */
87+
r = 0x0100_0000; /* r = moving bit from right to left */
88+
89+
while r != 0 {
90+
t = s + r as i32;
91+
if t <= ix {
92+
s = t + r as i32;
93+
ix -= t;
94+
q += r as i32;
95+
}
96+
ix += ix;
97+
r >>= 1;
98+
}
99+
100+
/* use floating add to find out rounding direction */
101+
if ix != 0 {
102+
z = ONE - TINY; /* trigger inexact flag */
103+
if z >= ONE {
104+
z = ONE + TINY;
105+
if z > ONE {
106+
q += 2;
107+
} else {
108+
q += q & 1;
109+
}
110+
}
111+
}
112+
ix = (q >> 1) + 0x3f00_0000;
113+
ix += m << 23;
114+
f32::from_bits(ix as u32)
115+
}

0 commit comments

Comments
 (0)