num_dual/
lib.rs

1//! Generalized, recursive, scalar and vector (hyper) dual numbers for the automatic and exact calculation of (partial) derivatives.
2//!
3//! # Example
4//! This example defines a generic scalar and a generic vector function that can be called using any (hyper-) dual number and automatically calculates derivatives.
5//! ```
6//! use num_dual::*;
7//! use nalgebra::SVector;
8//!
9//! fn foo<D: DualNum<f64>>(x: D) -> D {
10//!     x.powi(3)
11//! }
12//!
13//! fn bar<D: DualNum<f64>, const N: usize>(x: SVector<D, N>) -> D {
14//!     x.dot(&x).sqrt()
15//! }
16//!
17//! fn main() {
18//!     // Calculate a simple derivative
19//!     let (f, df) = first_derivative(foo, 5.0);
20//!     assert_eq!(f, 125.0);
21//!     assert_eq!(df, 75.0);
22//!
23//!     // Manually construct the dual number
24//!     let x = Dual64::new(5.0, 1.0);
25//!     println!("{}", foo(x));                     // 125 + 75ε
26//!
27//!     // Calculate a gradient
28//!     let (f, g) = gradient(bar, &SVector::from([4.0, 3.0]));
29//!     assert_eq!(f, 5.0);
30//!     assert_eq!(g[0], 0.8);
31//!
32//!     // Calculate a Hessian
33//!     let (f, g, h) = hessian(bar, &SVector::from([4.0, 3.0]));
34//!     println!("{h}");                            // [[0.072, -0.096], [-0.096, 0.128]]
35//!
36//!     // for x=cos(t) calculate the third derivative of foo w.r.t. t
37//!     let (f0, f1, f2, f3) = third_derivative(|t| foo(t.cos()), 1.0);
38//!     println!("{f3}");                           // 1.5836632930100278
39//! }
40//! ```
41//!
42//! # Usage
43//! There are two ways to use the data structures and functions provided in this crate:
44//! 1. (recommended) Using the provided functions for explicit ([`first_derivative`], [`gradient`], ...) and
45//!    implicit ([`implicit_derivative`], [`implicit_derivative_binary`], [`implicit_derivative_vec`]) functions.
46//! 2. (for experienced users) Using the different dual number types ([`Dual`], [`HyperDual`], [`DualVec`], ...) directly.
47//!
48//! The following examples and explanations focus on the first way.
49//!
50//! # Derivatives of explicit functions
51//! To be able to calculate the derivative of a function, it needs to be generic over the type of dual number used.
52//! Most commonly this would look like this:
53//! ```compile_fail
54//! fn foo<D: DualNum<f64> + Copy>(x: X) -> O {...}
55//! ```
56//! Of course, the function could also use single precision ([`f32`]) or be generic over the precision (`F:` [`DualNumFloat`]).
57//! For now, [`Copy`] is not a supertrait of [`DualNum`] to enable the calculation of derivatives with respect
58//! to a dynamic number of variables. However, in practice, using the [`Copy`] trait bound leads to an
59//! implementation that is more similar to one not using AD and there could be severe performance ramifications
60//! when using dynamically allocated dual numbers.
61//!
62//! The type `X` above is `D` for univariate functions, [`&OVector`](nalgebra::OVector) for multivariate
63//! functions, and `(D, D)` or `(&OVector, &OVector)` for partial derivatives. In the simplest case, the output
64//! `O` is a scalar `D`. However, it is generalized using the [`Mappable`] trait to also include types like
65//! [`Option<D>`] or [`Result<D, E>`], collections like [`Vec<D>`] or [`HashMap<K, D>`], or custom structs that
66//! implement the [`Mappable`] trait. Therefore, it is, e.g., possible to calculate the derivative of a fallible
67//! function:
68//!
69//! ```no_run
70//! # use num_dual::{DualNum, first_derivative};
71//! # type E = ();
72//! fn foo<D: DualNum<f64> + Copy>(x: D) -> Result<D, E> { todo!() }
73//!
74//! fn main() -> Result<(), E> {
75//!     let (val, deriv) = first_derivative(foo, 2.0)?;
76//!     // ...
77//!     Ok(())
78//! }
79//! ```
80//! All dual number types can contain other dual numbers as inner types. Therefore, it is also possible to
81//! use the different derivative functions inside of each other.
82//!
83//! ## Extra arguments
84//! The [`partial`] and [`partial2`] functions are used to pass additional arguments to the function, e.g.:
85//! ```no_run
86//! # use num_dual::{DualNum, first_derivative, partial};
87//! fn foo<D: DualNum<f64> + Copy>(x: D, args: &(D, D)) -> D { todo!() }
88//!
89//! fn main() {
90//!     let (val, deriv) = first_derivative(partial(foo, &(3.0, 4.0)), 5.0);
91//! }
92//! ```
93//! All types that implement the [`DualStruct`] trait can be used as additional function arguments. The
94//! only difference between using the [`partial`] and [`partial2`] functions compared to passing the extra
95//! arguments via a closure, is that the type of the extra arguments is automatically adjusted to the correct
96//! dual number type used for the automatic differentiation. Note that the following code would not compile:
97//! ```compile_fail
98//! # use num_dual::{DualNum, first_derivative};
99//! # fn foo<D: DualNum<f64> + Copy>(x: D, args: &(D, D)) -> D { todo!() }
100//! fn main() {
101//!     let (val, deriv) = first_derivative(|x| foo(x, &(3.0, 4.0)), 5.0);
102//! }
103//! ```
104//! The code created by [`partial`] essentially translates to:
105//! ```no_run
106//! # use num_dual::{DualNum, first_derivative, Dual, DualStruct};
107//! # fn foo<D: DualNum<f64> + Copy>(x: D, args: &(D, D)) -> D { todo!() }
108//! fn main() {
109//!     let (val, deriv) = first_derivative(|x| foo(x, &(Dual::from_inner(&3.0), Dual::from_inner(&4.0))), 5.0);
110//! }
111//! ```
112//!
113//! ## The [`Gradients`] trait
114//! The functions [`gradient`], [`hessian`], [`partial_hessian`] and [`jacobian`] are generic over the dimensionality
115//! of the variable vector. However, to use the functions in a generic context requires not using the [`Copy`] trait
116//! bound on the dual number type, because the dynamically sized dual numbers can by construction not implement
117//! [`Copy`]. Also, due to frequent heap allocations, the performance of the automatic differentiation could
118//! suffer significantly for dynamically sized dual numbers compared to statically sized dual numbers. The
119//! [`Gradients`] trait is introduced to overcome these limitations.
120//! ```
121//! # use num_dual::{DualNum, Gradients};
122//! # use nalgebra::{OVector, DefaultAllocator, allocator::Allocator, vector, dvector};
123//! # use approx::assert_relative_eq;
124//! fn foo<D: DualNum<f64> + Copy, N: Gradients>(x: OVector<D, N>, n: &D) -> D where DefaultAllocator: Allocator<N> {
125//!     x.dot(&x).sqrt() - n
126//! }
127//!
128//! fn main() {
129//!     let x = vector![1.0, 5.0, 5.0, 7.0];
130//!     let (f, grad) = Gradients::gradient(foo, &x, &10.0);
131//!     assert_eq!(f, 0.0);
132//!     assert_relative_eq!(grad, vector![0.1, 0.5, 0.5, 0.7]);
133//!
134//!     let x = dvector![1.0, 5.0, 5.0, 7.0];
135//!     let (f, grad) = Gradients::gradient(foo, &x, &10.0);
136//!     assert_eq!(f, 0.0);
137//!     assert_relative_eq!(grad, dvector![0.1, 0.5, 0.5, 0.7]);
138//! }
139//! ```
140//! For dynamically sized input arrays, the [`Gradients`] trait evaluates gradients or higher-order derivatives
141//! by iteratively evaluating scalar derivatives. For functions that do not rely on the [`Copy`] trait bound,
142//! only benchmarking can reveal Whether the increased performance through the avoidance of heap allocations
143//! can overcome the overhead of repeated function evaluations, i.e., if [`Gradients`] outperforms directly
144//! calling [`gradient`], [`hessian`], [`partial_hessian`] or [`jacobian`].
145//!
146//! # Derivatives of implicit functions
147//! Implicit differentiation is used to determine the derivative `dy/dx` where the output `y` is only related
148//! implicitly to the input `x` via the equation `f(x,y)=0`. Automatic implicit differentiation generalizes the
149//! idea to determining the output `y` with full derivative information. Note that the first step in calculating
150//! an implicit derivative is always determining the "real" part (i.e., neglecting all derivatives) of the equation
151//! `f(x,y)=0`. The `num-dual` library is focused on automatic differentiation and not nonlinear equation
152//! solving. Therefore, this first step needs to be done with your own custom solutions, or Rust crates for
153//! nonlinear equation solving and optimization like, e.g., [argmin](https://argmin-rs.org/).
154//!
155//! The following example implements a square root for generic dual numbers using implicit differentiation. Of
156//! course, the derivatives of the square root can also be determined explicitly using the chain rule, so the
157//! example serves mostly as illustration. `x.re()` provides the "real" part of the dual number which is a [`f64`]
158//! and therefore, we can use all the functionalities from the std library (including the square root).
159//! ```
160//! # use num_dual::{DualNum, implicit_derivative, first_derivative};
161//! fn implicit_sqrt<D: DualNum<f64> + Copy>(x: D) -> D {
162//!     implicit_derivative(|s, x| s * s - x, x.re().sqrt(), &x)
163//! }
164//!
165//! fn main() {
166//!     // sanity check, not actually calculating any derivative
167//!     assert_eq!(implicit_sqrt(25.0), 5.0);
168//!     
169//!     let (sq, deriv) = first_derivative(implicit_sqrt, 25.0);
170//!     assert_eq!(sq, 5.0);
171//!     // The derivative of sqrt(x) is 1/(2*sqrt(x)) which should evaluate to 0.1
172//!     assert_eq!(deriv, 0.1);
173//! }
174//! ```
175//! The `implicit_sqrt` or any likewise defined function is generic over the dual type `D`
176//! and can, therefore, be used anywhere as a part of an arbitrary complex computation. The functions
177//! [`implicit_derivative_binary`] and [`implicit_derivative_vec`] can be used for implicit functions
178//! with more than one variable.
179//!
180//! For implicit functions that contain complex models and a large number of parameters, the [`ImplicitDerivative`]
181//! interface might come in handy. The idea is to define the implicit function using the [`ImplicitFunction`] trait
182//! and feeding it into the [`ImplicitDerivative`] struct, which internally stores the parameters as dual numbers
183//! and their real parts. The [`ImplicitDerivative`] then provides methods for the evaluation of the real part
184//! of the residual (which can be passed to a nonlinear solver) and the implicit derivative which can be called
185//! after solving for the real part of the solution to reconstruct all the derivatives.
186//! ```
187//! # use num_dual::{ImplicitFunction, DualNum, Dual, ImplicitDerivative};
188//! struct ImplicitSqrt;
189//! impl ImplicitFunction<f64> for ImplicitSqrt {
190//!     type Parameters<D> = D;
191//!     type Variable<D> = D;
192//!     fn residual<D: DualNum<f64> + Copy>(x: D, square: &D) -> D {
193//!         *square - x * x
194//!     }
195//! }
196//!
197//! fn main() {
198//!     let x = Dual::from_re(25.0).derivative();
199//!     let func = ImplicitDerivative::new(ImplicitSqrt, x);
200//!     assert_eq!(func.residual(5.0), 0.0);
201//!     assert_eq!(x.sqrt(), func.implicit_derivative(5.0));
202//! }
203//! ```
204//!
205//! ## Combination with nonlinear solver libraries
206//! As mentioned previously, this crate does not contain any algorithms for nonlinear optimization or root finding.
207//! However, combining the capabilities of automatic differentiation with nonlinear solving can be very fruitful.
208//! Most importantly, the calculation of Jacobians or Hessians can be completely automated, if the model can be
209//! expressed within the functionalities of the [`DualNum`] trait. On top of that implicit derivatives can be of
210//! interest, if derivatives of the result of the optimization itself are relevant (e.g., in a bilevel
211//! optimization). The synergy is exploited in the [`ipopt-ad`](https://github.com/prehner/ipopt-ad) crate that
212//! turns the NLP solver [IPOPT](https://github.com/coin-or/Ipopt) into a black-box optimization algorithm (i.e.,
213//! it only requires a function that returns the values of the optimization variable and constraints), without
214//! any repercussions regarding the robustness or speed of convergence of the solver.
215//!
216//! If you are developing nonlinear optimization algorithms in Rust, feel free to reach out to us. We are happy to
217//! discuss how to enhance your algorithms with the automatic differentiation capabilities of this crate.
218
219#![warn(clippy::all)]
220#![warn(clippy::allow_attributes)]
221
222use nalgebra::allocator::Allocator;
223use nalgebra::{DefaultAllocator, Dim, OMatrix, Scalar};
224#[cfg(feature = "ndarray")]
225use ndarray::ScalarOperand;
226use num_traits::{Float, FloatConst, FromPrimitive, Inv, NumAssignOps, NumOps, Signed};
227use std::collections::HashMap;
228use std::fmt;
229use std::hash::Hash;
230use std::iter::{Product, Sum};
231
232#[macro_use]
233mod macros;
234#[macro_use]
235mod impl_derivatives;
236
237mod bessel;
238mod datatypes;
239mod explicit;
240mod implicit;
241pub use bessel::BesselDual;
242pub use datatypes::derivative::Derivative;
243pub use datatypes::dual::{Dual, Dual32, Dual64};
244pub use datatypes::dual_vec::{
245    DualDVec32, DualDVec64, DualSVec, DualSVec32, DualSVec64, DualVec, DualVec32, DualVec64,
246};
247pub use datatypes::dual2::{Dual2, Dual2_32, Dual2_64};
248pub use datatypes::dual2_vec::{
249    Dual2DVec, Dual2DVec32, Dual2DVec64, Dual2SVec, Dual2SVec32, Dual2SVec64, Dual2Vec, Dual2Vec32,
250    Dual2Vec64,
251};
252pub use datatypes::dual3::{Dual3, Dual3_32, Dual3_64};
253pub use datatypes::hyperdual::{HyperDual, HyperDual32, HyperDual64};
254pub use datatypes::hyperdual_vec::{
255    HyperDualDVec32, HyperDualDVec64, HyperDualSVec32, HyperDualSVec64, HyperDualVec,
256    HyperDualVec32, HyperDualVec64,
257};
258pub use datatypes::hyperhyperdual::{HyperHyperDual, HyperHyperDual32, HyperHyperDual64};
259pub use datatypes::real::Real;
260pub use explicit::{
261    Gradients, first_derivative, gradient, hessian, jacobian, partial, partial_hessian, partial2,
262    partial3, second_derivative, second_partial_derivative, third_derivative,
263    third_partial_derivative, third_partial_derivative_vec, zeroth_derivative,
264};
265pub use implicit::{
266    ImplicitDerivative, ImplicitFunction, implicit_derivative, implicit_derivative_binary,
267    implicit_derivative_sp, implicit_derivative_vec,
268};
269
270pub mod linalg;
271
272#[cfg(feature = "python")]
273pub mod python;
274
275#[cfg(feature = "python_macro")]
276mod python_macro;
277
278/// A generalized (hyper) dual number.
279#[cfg(feature = "ndarray")]
280pub trait DualNum<F>:
281    NumOps
282    + for<'r> NumOps<&'r Self>
283    + Signed
284    + NumOps<F>
285    + NumAssignOps
286    + NumAssignOps<F>
287    + Clone
288    + Inv<Output = Self>
289    + Sum
290    + Product
291    + FromPrimitive
292    + From<F>
293    + DualStruct<Self, F, Real = F>
294    + Mappable<Self>
295    + fmt::Display
296    + PartialOrd
297    + PartialOrd<F>
298    + fmt::Debug
299    + ScalarOperand
300    + 'static
301{
302    /// Highest derivative that can be calculated with this struct
303    const NDERIV: usize;
304
305    /// Reciprocal (inverse) of a number `1/x`
306    fn recip(&self) -> Self;
307
308    /// Power with integer exponent `x^n`
309    fn powi(&self, n: i32) -> Self;
310
311    /// Power with real exponent `x^n`
312    fn powf(&self, n: F) -> Self;
313
314    /// Square root
315    fn sqrt(&self) -> Self;
316
317    /// Cubic root
318    fn cbrt(&self) -> Self;
319
320    /// Exponential `e^x`
321    fn exp(&self) -> Self;
322
323    /// Exponential with base 2 `2^x`
324    fn exp2(&self) -> Self;
325
326    /// Exponential minus 1 `e^x-1`
327    fn exp_m1(&self) -> Self;
328
329    /// Natural logarithm
330    fn ln(&self) -> Self;
331
332    /// Logarithm with arbitrary base
333    fn log(&self, base: F) -> Self;
334
335    /// Logarithm with base 2
336    fn log2(&self) -> Self;
337
338    /// Logarithm with base 10
339    fn log10(&self) -> Self;
340
341    /// Logarithm on x plus one `ln(1+x)`
342    fn ln_1p(&self) -> Self;
343
344    /// Sine
345    fn sin(&self) -> Self;
346
347    /// Cosine
348    fn cos(&self) -> Self;
349
350    /// Tangent
351    fn tan(&self) -> Self;
352
353    /// Calculate sine and cosine simultaneously
354    fn sin_cos(&self) -> (Self, Self);
355
356    /// Arcsine
357    fn asin(&self) -> Self;
358
359    /// Arccosine
360    fn acos(&self) -> Self;
361
362    /// Arctangent
363    fn atan(&self) -> Self;
364
365    /// Arctangent
366    fn atan2(&self, other: Self) -> Self;
367
368    /// Hyperbolic sine
369    fn sinh(&self) -> Self;
370
371    /// Hyperbolic cosine
372    fn cosh(&self) -> Self;
373
374    /// Hyperbolic tangent
375    fn tanh(&self) -> Self;
376
377    /// Area hyperbolic sine
378    fn asinh(&self) -> Self;
379
380    /// Area hyperbolic cosine
381    fn acosh(&self) -> Self;
382
383    /// Area hyperbolic tangent
384    fn atanh(&self) -> Self;
385
386    /// 0th order spherical Bessel function of the first kind
387    fn sph_j0(&self) -> Self;
388
389    /// 1st order spherical Bessel function of the first kind
390    fn sph_j1(&self) -> Self;
391
392    /// 2nd order spherical Bessel function of the first kind
393    fn sph_j2(&self) -> Self;
394
395    /// Fused multiply-add
396    #[inline]
397    fn mul_add(&self, a: Self, b: Self) -> Self {
398        self.clone() * a + b
399    }
400
401    /// Power with dual exponent `x^n`
402    #[inline]
403    fn powd(&self, exp: Self) -> Self {
404        (self.ln() * exp).exp()
405    }
406}
407
408/// A generalized (hyper) dual number.
409#[cfg(not(feature = "ndarray"))]
410pub trait DualNum<F>:
411    NumOps
412    + for<'r> NumOps<&'r Self>
413    + Signed
414    + NumOps<F>
415    + NumAssignOps
416    + NumAssignOps<F>
417    + Clone
418    + Inv<Output = Self>
419    + Sum
420    + Product
421    + FromPrimitive
422    + From<F>
423    + DualStruct<Self, F, Real = F>
424    + Mappable<Self>
425    + fmt::Display
426    + PartialOrd
427    + PartialOrd<F>
428    + fmt::Debug
429    + 'static
430{
431    /// Highest derivative that can be calculated with this struct
432    const NDERIV: usize;
433
434    /// Reciprocal (inverse) of a number `1/x`
435    fn recip(&self) -> Self;
436
437    /// Power with integer exponent `x^n`
438    fn powi(&self, n: i32) -> Self;
439
440    /// Power with real exponent `x^n`
441    fn powf(&self, n: F) -> Self;
442
443    /// Square root
444    fn sqrt(&self) -> Self;
445
446    /// Cubic root
447    fn cbrt(&self) -> Self;
448
449    /// Exponential `e^x`
450    fn exp(&self) -> Self;
451
452    /// Exponential with base 2 `2^x`
453    fn exp2(&self) -> Self;
454
455    /// Exponential minus 1 `e^x-1`
456    fn exp_m1(&self) -> Self;
457
458    /// Natural logarithm
459    fn ln(&self) -> Self;
460
461    /// Logarithm with arbitrary base
462    fn log(&self, base: F) -> Self;
463
464    /// Logarithm with base 2
465    fn log2(&self) -> Self;
466
467    /// Logarithm with base 10
468    fn log10(&self) -> Self;
469
470    /// Logarithm on x plus one `ln(1+x)`
471    fn ln_1p(&self) -> Self;
472
473    /// Sine
474    fn sin(&self) -> Self;
475
476    /// Cosine
477    fn cos(&self) -> Self;
478
479    /// Tangent
480    fn tan(&self) -> Self;
481
482    /// Calculate sine and cosine simultaneously
483    fn sin_cos(&self) -> (Self, Self);
484
485    /// Arcsine
486    fn asin(&self) -> Self;
487
488    /// Arccosine
489    fn acos(&self) -> Self;
490
491    /// Arctangent
492    fn atan(&self) -> Self;
493
494    /// Arctangent
495    fn atan2(&self, other: Self) -> Self;
496
497    /// Hyperbolic sine
498    fn sinh(&self) -> Self;
499
500    /// Hyperbolic cosine
501    fn cosh(&self) -> Self;
502
503    /// Hyperbolic tangent
504    fn tanh(&self) -> Self;
505
506    /// Area hyperbolic sine
507    fn asinh(&self) -> Self;
508
509    /// Area hyperbolic cosine
510    fn acosh(&self) -> Self;
511
512    /// Area hyperbolic tangent
513    fn atanh(&self) -> Self;
514
515    /// 0th order spherical Bessel function of the first kind
516    fn sph_j0(&self) -> Self;
517
518    /// 1st order spherical Bessel function of the first kind
519    fn sph_j1(&self) -> Self;
520
521    /// 2nd order spherical Bessel function of the first kind
522    fn sph_j2(&self) -> Self;
523
524    /// Fused multiply-add
525    #[inline]
526    fn mul_add(&self, a: Self, b: Self) -> Self {
527        self.clone() * a + b
528    }
529
530    /// Power with dual exponent `x^n`
531    #[inline]
532    fn powd(&self, exp: Self) -> Self {
533        (self.ln() * exp).exp()
534    }
535}
536
537/// The underlying data type of individual derivatives. Usually f32 or f64.
538pub trait DualNumFloat:
539    Float + FloatConst + FromPrimitive + Signed + fmt::Display + fmt::Debug + Sync + Send + 'static
540{
541}
542impl<T> DualNumFloat for T where
543    T: Float
544        + FloatConst
545        + FromPrimitive
546        + Signed
547        + fmt::Display
548        + fmt::Debug
549        + Sync
550        + Send
551        + 'static
552{
553}
554
555macro_rules! impl_dual_num_float {
556    ($float:ty) => {
557        impl DualNum<$float> for $float {
558            const NDERIV: usize = 0;
559
560            fn mul_add(&self, a: Self, b: Self) -> Self {
561                <$float>::mul_add(*self, a, b)
562            }
563            fn recip(&self) -> Self {
564                <$float>::recip(*self)
565            }
566            fn powi(&self, n: i32) -> Self {
567                <$float>::powi(*self, n)
568            }
569            fn powf(&self, n: Self) -> Self {
570                <$float>::powf(*self, n)
571            }
572            fn powd(&self, n: Self) -> Self {
573                <$float>::powf(*self, n)
574            }
575            fn sqrt(&self) -> Self {
576                <$float>::sqrt(*self)
577            }
578            fn exp(&self) -> Self {
579                <$float>::exp(*self)
580            }
581            fn exp2(&self) -> Self {
582                <$float>::exp2(*self)
583            }
584            fn ln(&self) -> Self {
585                <$float>::ln(*self)
586            }
587            fn log(&self, base: Self) -> Self {
588                <$float>::log(*self, base)
589            }
590            fn log2(&self) -> Self {
591                <$float>::log2(*self)
592            }
593            fn log10(&self) -> Self {
594                <$float>::log10(*self)
595            }
596            fn cbrt(&self) -> Self {
597                <$float>::cbrt(*self)
598            }
599            fn sin(&self) -> Self {
600                <$float>::sin(*self)
601            }
602            fn cos(&self) -> Self {
603                <$float>::cos(*self)
604            }
605            fn tan(&self) -> Self {
606                <$float>::tan(*self)
607            }
608            fn asin(&self) -> Self {
609                <$float>::asin(*self)
610            }
611            fn acos(&self) -> Self {
612                <$float>::acos(*self)
613            }
614            fn atan(&self) -> Self {
615                <$float>::atan(*self)
616            }
617            fn atan2(&self, other: $float) -> Self {
618                <$float>::atan2(*self, other)
619            }
620            fn sin_cos(&self) -> (Self, Self) {
621                <$float>::sin_cos(*self)
622            }
623            fn exp_m1(&self) -> Self {
624                <$float>::exp_m1(*self)
625            }
626            fn ln_1p(&self) -> Self {
627                <$float>::ln_1p(*self)
628            }
629            fn sinh(&self) -> Self {
630                <$float>::sinh(*self)
631            }
632            fn cosh(&self) -> Self {
633                <$float>::cosh(*self)
634            }
635            fn tanh(&self) -> Self {
636                <$float>::tanh(*self)
637            }
638            fn asinh(&self) -> Self {
639                <$float>::asinh(*self)
640            }
641            fn acosh(&self) -> Self {
642                <$float>::acosh(*self)
643            }
644            fn atanh(&self) -> Self {
645                <$float>::atanh(*self)
646            }
647            fn sph_j0(&self) -> Self {
648                if self.abs() < <$float>::EPSILON {
649                    1.0 - self * self / 6.0
650                } else {
651                    self.sin() / self
652                }
653            }
654            fn sph_j1(&self) -> Self {
655                if self.abs() < <$float>::EPSILON {
656                    self / 3.0
657                } else {
658                    let sc = self.sin_cos();
659                    let rec = self.recip();
660                    (sc.0 * rec - sc.1) * rec
661                }
662            }
663            fn sph_j2(&self) -> Self {
664                if self.abs() < <$float>::EPSILON {
665                    self * self / 15.0
666                } else {
667                    let sc = self.sin_cos();
668                    let s2 = self * self;
669                    ((3.0 - s2) * sc.0 - 3.0 * self * sc.1) / (self * s2)
670                }
671            }
672        }
673    };
674}
675
676impl_dual_num_float!(f32);
677impl_dual_num_float!(f64);
678
679/// A struct that contains dual numbers. Needed for arbitrary arguments in [ImplicitFunction].
680///
681/// The trait is implemented for all dual types themselves, and common data types (tuple, vec,
682/// array, ...) and can be implemented for custom data types to achieve full flexibility.
683pub trait DualStruct<D, F> {
684    type Real;
685    type Inner;
686    fn re(&self) -> Self::Real;
687    fn from_inner(inner: &Self::Inner) -> Self;
688}
689
690/// Trait for structs used as an output of functions for which derivatives are calculated.
691///
692/// The main intention is to generalize the calculation of derivatives to fallible functions, but
693/// other use cases might also appear in the future.
694pub trait Mappable<D> {
695    type Output<O>;
696    fn map_dual<M: Fn(D) -> O, O>(self, f: M) -> Self::Output<O>;
697}
698
699impl<D, F> DualStruct<D, F> for () {
700    type Real = ();
701    type Inner = ();
702    fn re(&self) {}
703    fn from_inner(_: &Self::Inner) -> Self {}
704}
705
706impl<D> Mappable<D> for () {
707    type Output<O> = ();
708    fn map_dual<M: FnOnce(D) -> O, O>(self, _: M) {}
709}
710
711impl DualStruct<f32, f32> for f32 {
712    type Real = f32;
713    type Inner = f32;
714    fn re(&self) -> f32 {
715        *self
716    }
717    fn from_inner(inner: &Self::Inner) -> Self {
718        *inner
719    }
720}
721
722impl Mappable<f32> for f32 {
723    type Output<O> = O;
724    fn map_dual<M: FnOnce(f32) -> O, O>(self, f: M) -> Self::Output<O> {
725        f(self)
726    }
727}
728
729impl DualStruct<f64, f64> for f64 {
730    type Real = f64;
731    type Inner = f64;
732    fn re(&self) -> f64 {
733        *self
734    }
735    fn from_inner(inner: &Self::Inner) -> Self {
736        *inner
737    }
738}
739
740impl Mappable<f64> for f64 {
741    type Output<O> = O;
742    fn map_dual<M: FnOnce(f64) -> O, O>(self, f: M) -> Self::Output<O> {
743        f(self)
744    }
745}
746
747impl<D, F, T1: DualStruct<D, F>, T2: DualStruct<D, F>> DualStruct<D, F> for (T1, T2) {
748    type Real = (T1::Real, T2::Real);
749    type Inner = (T1::Inner, T2::Inner);
750    fn re(&self) -> Self::Real {
751        let (s1, s2) = self;
752        (s1.re(), s2.re())
753    }
754    fn from_inner(re: &Self::Inner) -> Self {
755        let (r1, r2) = re;
756        (T1::from_inner(r1), T2::from_inner(r2))
757    }
758}
759
760impl<D, T1: Mappable<D>, T2: Mappable<D>> Mappable<D> for (T1, T2) {
761    type Output<O> = (T1::Output<O>, T2::Output<O>);
762    fn map_dual<M: Fn(D) -> O, O>(self, f: M) -> Self::Output<O> {
763        let (s1, s2) = self;
764        (s1.map_dual(&f), s2.map_dual(&f))
765    }
766}
767
768impl<D, F, T1: DualStruct<D, F>, T2: DualStruct<D, F>, T3: DualStruct<D, F>> DualStruct<D, F>
769    for (T1, T2, T3)
770{
771    type Real = (T1::Real, T2::Real, T3::Real);
772    type Inner = (T1::Inner, T2::Inner, T3::Inner);
773    fn re(&self) -> Self::Real {
774        let (s1, s2, s3) = self;
775        (s1.re(), s2.re(), s3.re())
776    }
777    fn from_inner(inner: &Self::Inner) -> Self {
778        let (r1, r2, r3) = inner;
779        (T1::from_inner(r1), T2::from_inner(r2), T3::from_inner(r3))
780    }
781}
782
783impl<D, T1: Mappable<D>, T2: Mappable<D>, T3: Mappable<D>> Mappable<D> for (T1, T2, T3) {
784    type Output<O> = (T1::Output<O>, T2::Output<O>, T3::Output<O>);
785    fn map_dual<M: Fn(D) -> O, O>(self, f: M) -> Self::Output<O> {
786        let (s1, s2, s3) = self;
787        (s1.map_dual(&f), s2.map_dual(&f), s3.map_dual(&f))
788    }
789}
790
791impl<D, F, T1: DualStruct<D, F>, T2: DualStruct<D, F>, T3: DualStruct<D, F>, T4: DualStruct<D, F>>
792    DualStruct<D, F> for (T1, T2, T3, T4)
793{
794    type Real = (T1::Real, T2::Real, T3::Real, T4::Real);
795    type Inner = (T1::Inner, T2::Inner, T3::Inner, T4::Inner);
796    fn re(&self) -> Self::Real {
797        let (s1, s2, s3, s4) = self;
798        (s1.re(), s2.re(), s3.re(), s4.re())
799    }
800    fn from_inner(inner: &Self::Inner) -> Self {
801        let (r1, r2, r3, r4) = inner;
802        (
803            T1::from_inner(r1),
804            T2::from_inner(r2),
805            T3::from_inner(r3),
806            T4::from_inner(r4),
807        )
808    }
809}
810
811impl<D, T1: Mappable<D>, T2: Mappable<D>, T3: Mappable<D>, T4: Mappable<D>> Mappable<D>
812    for (T1, T2, T3, T4)
813{
814    type Output<O> = (T1::Output<O>, T2::Output<O>, T3::Output<O>, T4::Output<O>);
815    fn map_dual<M: Fn(D) -> O, O>(self, f: M) -> Self::Output<O> {
816        let (s1, s2, s3, s4) = self;
817        (
818            s1.map_dual(&f),
819            s2.map_dual(&f),
820            s3.map_dual(&f),
821            s4.map_dual(&f),
822        )
823    }
824}
825
826impl<
827    D,
828    F,
829    T1: DualStruct<D, F>,
830    T2: DualStruct<D, F>,
831    T3: DualStruct<D, F>,
832    T4: DualStruct<D, F>,
833    T5: DualStruct<D, F>,
834> DualStruct<D, F> for (T1, T2, T3, T4, T5)
835{
836    type Real = (T1::Real, T2::Real, T3::Real, T4::Real, T5::Real);
837    type Inner = (T1::Inner, T2::Inner, T3::Inner, T4::Inner, T5::Inner);
838    fn re(&self) -> Self::Real {
839        let (s1, s2, s3, s4, s5) = self;
840        (s1.re(), s2.re(), s3.re(), s4.re(), s5.re())
841    }
842    fn from_inner(inner: &Self::Inner) -> Self {
843        let (r1, r2, r3, r4, r5) = inner;
844        (
845            T1::from_inner(r1),
846            T2::from_inner(r2),
847            T3::from_inner(r3),
848            T4::from_inner(r4),
849            T5::from_inner(r5),
850        )
851    }
852}
853
854impl<D, T1: Mappable<D>, T2: Mappable<D>, T3: Mappable<D>, T4: Mappable<D>, T5: Mappable<D>>
855    Mappable<D> for (T1, T2, T3, T4, T5)
856{
857    type Output<O> = (
858        T1::Output<O>,
859        T2::Output<O>,
860        T3::Output<O>,
861        T4::Output<O>,
862        T5::Output<O>,
863    );
864    fn map_dual<M: Fn(D) -> O, O>(self, f: M) -> Self::Output<O> {
865        let (s1, s2, s3, s4, s5) = self;
866        (
867            s1.map_dual(&f),
868            s2.map_dual(&f),
869            s3.map_dual(&f),
870            s4.map_dual(&f),
871            s5.map_dual(&f),
872        )
873    }
874}
875
876impl<D, F, T: DualStruct<D, F>, const N: usize> DualStruct<D, F> for [T; N] {
877    type Real = [T::Real; N];
878    type Inner = [T::Inner; N];
879    fn re(&self) -> Self::Real {
880        self.each_ref().map(|x| x.re())
881    }
882    fn from_inner(re: &Self::Inner) -> Self {
883        re.each_ref().map(T::from_inner)
884    }
885}
886
887impl<D, T: Mappable<D>, const N: usize> Mappable<D> for [T; N] {
888    type Output<O> = [T::Output<O>; N];
889    fn map_dual<M: Fn(D) -> O, O>(self, f: M) -> Self::Output<O> {
890        self.map(|x| x.map_dual(&f))
891    }
892}
893
894impl<D, F, T: DualStruct<D, F>> DualStruct<D, F> for Option<T> {
895    type Real = Option<T::Real>;
896    type Inner = Option<T::Inner>;
897    fn re(&self) -> Self::Real {
898        self.as_ref().map(|x| x.re())
899    }
900    fn from_inner(inner: &Self::Inner) -> Self {
901        inner.as_ref().map(|x| T::from_inner(x))
902    }
903}
904
905impl<D, T: Mappable<D>> Mappable<D> for Option<T> {
906    type Output<O> = Option<T::Output<O>>;
907    fn map_dual<M: Fn(D) -> O, O>(self, f: M) -> Self::Output<O> {
908        self.map(|x| x.map_dual(f))
909    }
910}
911
912impl<D, T: Mappable<D>, E> Mappable<D> for Result<T, E> {
913    type Output<O> = Result<T::Output<O>, E>;
914    fn map_dual<M: Fn(D) -> O, O>(self, f: M) -> Self::Output<O> {
915        self.map(|x| x.map_dual(f))
916    }
917}
918
919impl<D, F, T: DualStruct<D, F>> DualStruct<D, F> for Vec<T> {
920    type Real = Vec<T::Real>;
921    type Inner = Vec<T::Inner>;
922    fn re(&self) -> Self::Real {
923        self.iter().map(|x| x.re()).collect()
924    }
925    fn from_inner(inner: &Self::Inner) -> Self {
926        inner.iter().map(|x| T::from_inner(x)).collect()
927    }
928}
929
930impl<D, T: Mappable<D>> Mappable<D> for Vec<T> {
931    type Output<O> = Vec<T::Output<O>>;
932    fn map_dual<M: Fn(D) -> O, O>(self, f: M) -> Self::Output<O> {
933        self.into_iter().map(|x| x.map_dual(&f)).collect()
934    }
935}
936
937impl<D, F, T: DualStruct<D, F>, K: Clone + Eq + Hash> DualStruct<D, F> for HashMap<K, T> {
938    type Real = HashMap<K, T::Real>;
939    type Inner = HashMap<K, T::Inner>;
940    fn re(&self) -> Self::Real {
941        self.iter().map(|(k, x)| (k.clone(), x.re())).collect()
942    }
943    fn from_inner(inner: &Self::Inner) -> Self {
944        inner
945            .iter()
946            .map(|(k, x)| (k.clone(), T::from_inner(x)))
947            .collect()
948    }
949}
950
951impl<D, T: Mappable<D>, K: Eq + Hash> Mappable<D> for HashMap<K, T> {
952    type Output<O> = HashMap<K, T::Output<O>>;
953    fn map_dual<M: Fn(D) -> O, O>(self, f: M) -> Self::Output<O> {
954        self.into_iter().map(|(k, x)| (k, x.map_dual(&f))).collect()
955    }
956}
957
958impl<D: DualNum<F>, F: DualNumFloat, R: Dim, C: Dim> DualStruct<D, F> for OMatrix<D, R, C>
959where
960    DefaultAllocator: Allocator<R, C>,
961    D::Inner: DualNum<F>,
962{
963    type Real = OMatrix<F, R, C>;
964    type Inner = OMatrix<D::Inner, R, C>;
965    fn re(&self) -> Self::Real {
966        self.map(|x| x.re())
967    }
968    fn from_inner(inner: &Self::Inner) -> Self {
969        inner.map(|x| D::from_inner(&x))
970    }
971}
972
973impl<D: Scalar, R: Dim, C: Dim> Mappable<Self> for OMatrix<D, R, C>
974where
975    DefaultAllocator: Allocator<R, C>,
976{
977    type Output<O> = O;
978    fn map_dual<M: Fn(Self) -> O, O>(self, f: M) -> O {
979        f(self)
980    }
981}
num_dual/lib.rs

num_dual/
lib.rs