Clarify in the docs that `mul_add` is not always faster.

More info:

- https://github.com/rust-lang/rust/issues/49842
- https://github.com/rust-lang/rust/pull/50572
This commit is contained in:
Corey Farwell 2018-05-20 11:55:54 -04:00
parent f4125621ac
commit 4775dee66b
3 changed files with 13 additions and 8 deletions

View File

@ -1237,8 +1237,10 @@ pub trait Float
fn is_sign_negative(self) -> bool; fn is_sign_negative(self) -> bool;
/// Fused multiply-add. Computes `(self * a) + b` with only one rounding /// Fused multiply-add. Computes `(self * a) + b` with only one rounding
/// error. This produces a more accurate result with better performance than /// error, yielding a more accurate result than an unfused multiply-add.
/// a separate multiplication operation followed by an add. ///
/// Using `mul_add` can be more performant than an unfused multiply-add if
/// the target architecture has a dedicated `fma` CPU instruction.
/// ///
/// ``` /// ```
/// use num_traits::Float; /// use num_traits::Float;

View File

@ -1,7 +1,8 @@
/// The fused multiply-add operation. /// Fused multiply-add. Computes `(self * a) + b` with only one rounding
/// Computes (self * a) + b with only one rounding error. /// error, yielding a more accurate result than an unfused multiply-add.
/// This produces a more accurate result with better performance ///
/// than a separate multiplication operation followed by an add. /// Using `mul_add` can be more performant than an unfused multiply-add if
/// the target architecture has a dedicated `fma` CPU instruction.
/// ///
/// Note that `A` and `B` are `Self` by default, but this is not mandatory. /// Note that `A` and `B` are `Self` by default, but this is not mandatory.
/// ///

View File

@ -215,8 +215,10 @@ pub trait Real
fn is_sign_negative(self) -> bool; fn is_sign_negative(self) -> bool;
/// Fused multiply-add. Computes `(self * a) + b` with only one rounding /// Fused multiply-add. Computes `(self * a) + b` with only one rounding
/// error. This produces a more accurate result with better performance than /// error, yielding a more accurate result than an unfused multiply-add.
/// a separate multiplication operation followed by an add. ///
/// Using `mul_add` can be more performant than an unfused multiply-add if
/// the target architecture has a dedicated `fma` CPU instruction.
/// ///
/// ``` /// ```
/// use num_traits::real::Real; /// use num_traits::real::Real;