use core::f64;

// IVLN2HI + IVLN2LO together approximate 1/ln(2). The value is split into a
// high part and a small correction so that the products formed at the end of
// `log2` lose less precision than a single multiplication would.
const IVLN2HI: f64 = 1.44269504072144627571e+00; /* 0x3ff71547, 0x65200000 */
const IVLN2LO: f64 = 1.67517131648865118353e-10; /* 0x3de705fc, 0x2eefa200 */

// Coefficients of the polynomial in s^2 used to approximate log(1+f).
const LG1: f64 = 6.666666666666735130e-01; /* 3FE55555 55555593 */
const LG2: f64 = 3.999999999940941908e-01; /* 3FD99999 9997FA04 */
const LG3: f64 = 2.857142874366239149e-01; /* 3FD24924 94229359 */
const LG4: f64 = 2.222219843214978396e-01; /* 3FCC71C5 1D8E78AF */
const LG5: f64 = 1.818357216161805012e-01; /* 3FC74664 96CB03DE */
const LG6: f64 = 1.531383769920937332e-01; /* 3FC39A09 D078C69F */
const LG7: f64 = 1.479819860511658591e-01; /* 3FC2F112 DF3E5244 */

/// Returns the base-2 logarithm of `x`.
///
/// The argument is decomposed as `x = 2^k * (1 + f)` with `1 + f` in
/// `[sqrt(2)/2, sqrt(2)]`; `log(1 + f)` is evaluated as a `hi + lo` pair,
/// scaled by `1/ln(2)`, and then added to `k`.
///
/// Special cases:
/// * `log2(+0.0)` and `log2(-0.0)` return negative infinity.
/// * `log2(x)` for any other `x` with the sign bit set returns NaN.
/// * `log2(+inf)` and `log2(NaN)` (sign bit clear) return `x` unchanged.
/// * `log2(1.0)` returns `0.0` exactly.
pub fn log2(mut x: f64) -> f64 {
    let x1p54 = f64::from_bits(0x4350000000000000); // 0x1p54 === 2 ^ 54

    let mut ui: u64 = x.to_bits();
    let mut hx: u32 = (ui >> 32) as u32; // upper word: sign, exponent, top of mantissa
    let mut k: i32 = 0;

    if hx < 0x00100000 || (hx >> 31) > 0 {
        // Either the biased exponent is zero (zero / subnormal) or the sign bit is set.
        if ui << 1 == 0 {
            return -1. / (x * x); /* log(+-0)=-inf */
        }
        if (hx >> 31) > 0 {
            return (x - x) / 0.0; /* log(-#) = NaN */
        }
        /* subnormal number, scale x up */
        k -= 54;
        x *= x1p54;
        ui = x.to_bits();
        hx = (ui >> 32) as u32;
    } else if hx >= 0x7ff00000 {
        // +inf or NaN: propagate the argument.
        return x;
    } else if hx == 0x3ff00000 && ui << 32 == 0 {
        // x == 1.0 exactly.
        return 0.;
    }

    /* reduce x into [sqrt(2)/2, sqrt(2)] */
    hx += 0x3ff00000 - 0x3fe6a09e;
    k += (hx >> 20) as i32 - 0x3ff;
    hx = (hx & 0x000fffff) + 0x3fe6a09e;
    ui = ((hx as u64) << 32) | (ui & 0xffffffff);
    x = f64::from_bits(ui);

    let f = x - 1.0;
    let hfsq = 0.5 * f * f;
    let s = f / (2.0 + f);
    let z = s * s;
    let w = z * z;
    // The polynomial is evaluated as two interleaved halves (even and odd coefficients).
    let t1 = w * (LG2 + w * (LG4 + w * LG6));
    let t2 = z * (LG1 + w * (LG3 + w * (LG5 + w * LG7)));
    let r = t2 + t1;

    /* hi+lo = f - hfsq + s*(hfsq+R) ~ log(1+f) */
    // Clear the low 32 bits of `hi`; `lo` picks up what was cut off.
    let hi = f64::from_bits((f - hfsq).to_bits() & 0xffff_ffff_0000_0000);
    let lo = f - hi - hfsq + s * (hfsq + r);

    let val_hi = hi * IVLN2HI;
    let mut val_lo = (lo + hi) * IVLN2LO + lo * IVLN2HI;

    /* spadd(val_hi, val_lo, y), except for not using double_t: */
    // Add the integer exponent `k` to the high part and fold the rounding
    // error of that addition into the low part.
    let y = f64::from(k);
    let sum = y + val_hi;
    val_lo += (y - sum) + val_hi;

    val_lo + sum
}