1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
use core::f32 as f;
use ieee754::Ieee754;
#[inline]
pub fn log2(x: f32) -> f32 {
let (sign, exp, signif) = x.decompose_raw();
if sign {
f::NAN
} else if exp == 0 {
log2_exp_0(signif)
} else if exp == 0xFF {
if signif == 0 {
f::INFINITY
} else {
f::NAN
}
} else {
log2_raw(x)
}
}
#[inline(never)]
fn log2_exp_0(signif: u32) -> f32 {
if signif == 0 {
f::NEG_INFINITY
} else {
let zeros = signif.leading_zeros() - 9 + 1;
-126.0 - zeros as f32 + log2(f32::recompose_raw(false, 127, signif << zeros))
}
}
#[inline]
pub fn log2_raw(x: f32) -> f32 {
let (_sign, exp, signif) = x.decompose_raw();
debug_assert!(!_sign && 1 <= exp && exp <= 254);
let high_bit = ((signif >> 22) & 1) as u8;
let add_exp = (exp + high_bit) as i32 - 127;
let normalised = f32::recompose_raw(false, 0x7F ^ high_bit, signif) - 1.0;
const A: f32 = -0.6296735;
const B: f32 = 1.466967;
add_exp as f32 + normalised * (B + A * normalised)
}
#[cfg(test)]
mod tests {
use super::*;
use quickcheck as qc;
use std::f32 as f;
use ieee754::Ieee754;
#[test]
fn log2_rel_err_qc() {
fn prop(x: f32) -> qc::TestResult {
if !(x > 0.0) { return qc::TestResult::discard() }
let e = log2(x);
let t = x.log2();
qc::TestResult::from_bool(e.rel_error(t).abs() < 0.025)
}
qc::quickcheck(prop as fn(f32) -> qc::TestResult)
}
const PREC: u32 = 1 << 20;
#[test]
fn log2_rel_err_exhaustive() {
let mut max = 0.0;
for i in 0..PREC + 1 {
for j in -5..6 {
let x = (1.0 + i as f32 / PREC as f32) * 2f32.powi(j * 20);
let e = log2(x);
let t = x.log2();
let rel = e.rel_error(t).abs();
if rel > max { max = rel }
assert!(rel < 0.025 && (e - t).abs() < 0.009,
"{:.8}: {:.8}, {:.8}. {:.4}", x, e, t, rel);
}
}
println!("maximum {}", max);
}
#[test]
fn edge_cases() {
assert!(log2(f::NAN).is_nan());
assert!(log2(-1.0).is_nan());
assert!(log2(f::NEG_INFINITY).is_nan());
assert_eq!(log2(f::INFINITY), f::INFINITY);
assert_eq!(log2(0.0), f::NEG_INFINITY);
assert_eq!(log2(f32::recompose_raw(false, 0, 1)), -149.0);
}
#[test]
fn denormals() {
fn prop(x: u8, y: u16) -> bool {
let signif = ((x as u32) << 16) | (y as u32);
let mut x = f32::recompose_raw(false, 1, signif);
for _ in 0..23 {
assert!(x > 0.0);
let log = x.log2();
let e = log2(x);
let rel = e.rel_error(log).abs();
if rel >= 0.025 || (e - log).abs() > 0.009 {
return false
}
x /= 2.0;
}
true
}
qc::quickcheck(prop as fn(u8, u16) -> bool)
}
}