Added fused multiple-add method to Float4.
This commit is contained in:
parent
48e015996f
commit
b3cc5c070a
|
@ -232,6 +232,24 @@ mod x86_64_sse {
|
|||
data: unsafe { _mm_sqrt_ps(self.data) },
|
||||
}
|
||||
}
|
||||
|
||||
/// Performs a fused multiply add.
|
||||
///
|
||||
/// i.e. self * b + c
|
||||
#[inline(always)]
|
||||
pub fn fmadd(&self, b: Float4, c: Float4) -> Float4 {
|
||||
#[cfg(target_feature = "fma")]
|
||||
{
|
||||
use std::arch::x86_64::_mm_fmadd_ps;
|
||||
Float4 {
|
||||
data: unsafe { _mm_fmadd_ps(self.data, b.data, c.data) },
|
||||
}
|
||||
}
|
||||
#[cfg(not(target_feature = "fma"))]
|
||||
{
|
||||
(*self * b) + c
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
impl PartialEq for Float4 {
|
||||
|
@ -886,6 +904,14 @@ mod fallback {
|
|||
self.get_3().sqrt(),
|
||||
)
|
||||
}
|
||||
|
||||
/// Performs a fused multiply add.
|
||||
///
|
||||
/// i.e. self * b + c
|
||||
#[inline(always)]
|
||||
pub fn fmadd(&self, b: Float4, c: Float4) -> Float4 {
|
||||
(*self * b) + c
|
||||
}
|
||||
}
|
||||
|
||||
impl PartialEq for Float4 {
|
||||
|
|
Loading…
Reference in New Issue
Block a user