-
Notifications
You must be signed in to change notification settings - Fork 73
/
Copy pathmul_adde.rs
48 lines (43 loc) · 1.97 KB
/
mul_adde.rs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
//! Implements vertical (lane-wise) floating-point `mul_adde`.
// Generates the inherent `mul_adde` method for the vector type `$id`, plus a
// test module that is handed to `test_if!` together with `$test_tt`.
//
// `$elem_ty` is the scalar type used to build the test constants;
// `$elem_count` is accepted by the matcher but not used in this expansion.
macro_rules! impl_math_float_mul_adde {
    ([$elem_ty:ident; $elem_count:expr]: $id:ident | $test_tt:tt) => {
        impl $id {
            /// Multiply-add estimate: approximately `self * y + z`.
            ///
            /// A fused multiply-add (`fma`) has infinite precision, whereas
            /// `mul_adde` is, _at worst_, as precise as a multiply followed
            /// by a separate add. That relaxation may make it the more
            /// efficient choice on architectures without an `fma` instruction.
            #[inline]
            pub fn mul_adde(self, y: Self, z: Self) -> Self {
                // Dispatch through the trait by its full path; a plain
                // `self.mul_adde(..)` would resolve to this inherent method.
                crate::codegen::math::float::mul_adde::MulAddE::mul_adde(self, y, z)
            }
        }

        test_if! {
            $test_tt:
            paste::item! {
                pub mod [<$id _math_mul_adde>] {
                    use super::*;

                    #[cfg_attr(not(target_arch = "wasm32"), test)]
                    #[cfg_attr(target_arch = "wasm32", wasm_bindgen_test)]
                    fn mul_adde() {
                        // Splatted constants, named after the value in every lane.
                        let zero = $id::splat(0 as $elem_ty);
                        let one = $id::splat(1 as $elem_ty);
                        let two = $id::splat(2 as $elem_ty);
                        let three = $id::splat(3 as $elem_ty);
                        let four = $id::splat(4 as $elem_ty);

                        // Each check is `expected == a.mul_adde(b, c)`, i.e. `a * b + c`.
                        // Results equal to 0 and 1.
                        assert_eq!(zero, zero.mul_adde(zero, zero));
                        assert_eq!(one, one.mul_adde(one, zero));
                        assert_eq!(one, one.mul_adde(zero, one));
                        assert_eq!(one, zero.mul_adde(one, one));

                        // Results equal to 2.
                        assert_eq!(two, one.mul_adde(one, one));
                        assert_eq!(two, one.mul_adde(two, zero));
                        assert_eq!(two, two.mul_adde(one, zero));

                        // Results equal to 4 and 3.
                        assert_eq!(four, two.mul_adde(two, zero));
                        assert_eq!(four, two.mul_adde(one, two));
                        assert_eq!(three, two.mul_adde(one, one));
                    }
                }
            }
        }
    };
}