Smoothing (#17)

Patrick Stevens committed 2023-05-01 12:20:05 +01:00 (committed by GitHub)
parent 6dbd89aaac · commit bbbacd421b
4 changed files with 136 additions and 15 deletions


@@ -461,6 +461,16 @@ impl<A> RankedDifferentiable<A, 1> {
     {
         RankedDifferentiableTagged::of_slice_tagged(input, ())
     }
+
+    pub fn collect(self: RankedDifferentiable<A, 1>) -> Vec<A>
+    where
+        A: Copy,
+    {
+        self.to_vector()
+            .into_iter()
+            .map(|x| *x.to_scalar().real_part())
+            .collect::<Vec<_>>()
+    }
 }
 
 impl<A, Tag> RankedDifferentiableTagged<A, Tag, 2> {

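For orientation: the new collect method flattens a rank-1 tensor back into a Vec of its underlying values. A minimal usage sketch, separate from the commit itself (the crate path little_learner and the exact of_slice signature are assumptions inferred from the context lines above):

    use little_learner::auto_diff::RankedDifferentiable;
    use ordered_float::NotNan;

    fn main() {
        // Hypothetical crate path. Build a rank-1 tensor from NotNan<f64>
        // values, then flatten it back out with the new collect method.
        let xs = [
            NotNan::new(1.0).expect("not nan"),
            NotNan::new(2.0).expect("not nan"),
        ];
        let tensor = RankedDifferentiable::of_slice(&xs);
        assert_eq!(tensor.collect(), xs.to_vec());
    }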

@@ -8,5 +8,6 @@ pub mod expr_syntax_tree;
 pub mod loss;
 pub mod not_nan;
 pub mod scalar;
+pub mod smooth;
 pub mod tensor;
 pub mod traits;

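Registering the module in lib.rs is what exposes the new code to the rest of the workspace, e.g. (assuming the library crate is named little_learner):

    use little_learner::smooth::{smooth, smooth_tagged};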

@@ -0,0 +1,121 @@
+use crate::auto_diff::{Differentiable, DifferentiableTagged};
+use crate::scalar::Scalar;
+use crate::traits::One;
+use std::ops::{Add, Mul, Neg};
+
+/// Exponentially decaying average: `avg * decay + grad * (1 - decay)`,
+/// applied pointwise, with the two tag structures combined by `tags`.
+pub fn smooth_tagged<A, F, Tag1, Tag2, Tag3>(
+    decay: Scalar<A>,
+    current_avg: &DifferentiableTagged<A, Tag1>,
+    grad: &DifferentiableTagged<A, Tag2>,
+    mut tags: F,
+) -> DifferentiableTagged<A, Tag3>
+where
+    A: One + Clone + Mul<Output = A> + Neg<Output = A> + Add<Output = A>,
+    F: FnMut(Tag1, Tag2) -> Tag3,
+    Tag1: Clone,
+    Tag2: Clone,
+{
+    DifferentiableTagged::map2_tagged(current_avg, grad, &mut |avg, tag1, grad, tag2| {
+        (
+            (avg.clone() * decay.clone()) + (grad.clone() * (Scalar::<A>::one() + -decay.clone())),
+            tags(tag1, tag2),
+        )
+    })
+}
+
+/// `smooth_tagged`, specialised to untagged tensors.
+pub fn smooth<A>(
+    decay: Scalar<A>,
+    current_avg: &Differentiable<A>,
+    grad: &Differentiable<A>,
+) -> Differentiable<A>
+where
+    A: One + Clone + Mul<Output = A> + Neg<Output = A> + Add<Output = A>,
+{
+    smooth_tagged(decay, current_avg, grad, |(), ()| ())
+}
+
+#[cfg(test)]
+mod test_smooth {
+    use crate::auto_diff::Differentiable;
+    use crate::scalar::Scalar;
+    use crate::smooth::smooth;
+    use crate::traits::Zero;
+    use ordered_float::NotNan;
+
+    #[test]
+    fn one_dimension() {
+        let decay = Scalar::make(NotNan::new(0.9).expect("not nan"));
+        let smoothed = smooth(
+            decay.clone(),
+            &Differentiable::of_scalar(Scalar::<NotNan<f64>>::zero()),
+            &Differentiable::of_scalar(Scalar::make(NotNan::new(50.3).expect("not nan"))),
+        );
+        assert_eq!(
+            smoothed.into_scalar().real_part().into_inner(),
+            5.0299999999999985
+        );
+
+        let numbers = vec![50.3, 22.7, 4.3, 2.7, 1.8, 2.2, 0.6];
+        let mut output = Vec::with_capacity(numbers.len());
+        let mut acc = Scalar::<NotNan<f64>>::zero();
+        for number in numbers {
+            let number =
+                Differentiable::of_scalar(Scalar::make(NotNan::new(number).expect("not nan")));
+            let next = smooth(decay.clone(), &Differentiable::of_scalar(acc), &number);
+            output.push(next.clone().into_scalar().clone_real_part().into_inner());
+            acc = next.into_scalar();
+        }
+        // Note that the sequence printed in the book has been heavily affected by
+        // rounding: by zero-indexed element 4, it differs from these values in the
+        // first significant digit!
+        assert_eq!(
+            output,
+            vec![
+                5.0299999999999985,
+                6.7969999999999979,
+                6.5472999999999981,
+                6.1625699999999979,
+                5.7263129999999975,
+                5.3736816999999979,
+                4.8963135299999978
+            ]
+        )
+    }
+
+    fn hydrate(v: Vec<f64>) -> Differentiable<NotNan<f64>> {
+        Differentiable::of_vec(
+            v.iter()
+                .cloned()
+                .map(|v| Differentiable::of_scalar(Scalar::make(NotNan::new(v).expect("not nan"))))
+                .collect(),
+        )
+    }
+
+    #[test]
+    fn more_dimension() {
+        let decay = Scalar::make(NotNan::new(0.9).expect("not nan"));
+        let inputs = [
+            vec![1.0, 1.1, 3.0],
+            vec![13.4, 18.2, 41.4],
+            vec![1.1, 0.3, 67.3],
+        ]
+        .map(hydrate);
+        let mut current = hydrate(vec![0.8, 3.1, 2.2]);
+        let mut output = Vec::with_capacity(inputs.len());
+        for input in inputs {
+            current = smooth(decay.clone(), &current, &input);
+            output.push(current.clone().attach_rank::<1>().unwrap().collect());
+        }
+        assert_eq!(
+            output,
+            vec![
+                vec![0.82000000000000006, 2.9, 2.2800000000000002],
+                vec![2.0779999999999998, 4.4299999999999997, 6.1919999999999993],
+                vec![1.9802, 4.0169999999999995, 12.302799999999998]
+            ]
+        )
+    }
+}
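The smoothing above is the standard exponentially decaying average, next = decay * avg + (1 - decay) * observation. A self-contained sketch, not part of the commit, using plain f64 in place of Scalar<NotNan<f64>>; it reproduces the first test's expected sequence up to the same floating-point rounding:

    // next = decay * average + (1 - decay) * observation, which matches
    // smooth_tagged's avg * decay + grad * (one + (-decay)).
    fn smooth_f64(decay: f64, average: f64, observation: f64) -> f64 {
        decay * average + (1.0 - decay) * observation
    }

    fn main() {
        let decay = 0.9;
        let mut average = 0.0;
        for observation in [50.3, 22.7, 4.3, 2.7, 1.8, 2.2, 0.6] {
            average = smooth_f64(decay, average, observation);
            println!("{average}");
        }
        // The first iteration computes 0.9 * 0.0 + 0.1 * 50.3, i.e. 5.03 up to
        // rounding (5.0299999999999985, as asserted in one_dimension above).
    }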


@@ -176,17 +176,6 @@ where
     out.map(&mut predictor.deflate)
 }
 
-fn collect_vec<T>(input: RankedDifferentiable<NotNan<T>, 1>) -> Vec<T>
-where
-    T: Copy,
-{
-    input
-        .to_vector()
-        .into_iter()
-        .map(|x| x.to_scalar().real_part().into_inner())
-        .collect::<Vec<_>>()
-}
-
 fn main() {
     let plane_xs = [
         [1.0, 2.05],
@@ -228,7 +217,7 @@ fn main() {
     let theta0 = theta0.attach_rank::<1>().expect("rank 1 tensor");
     let theta1 = theta1.attach_rank::<0>().expect("rank 0 tensor");
-    assert_eq!(collect_vec(theta0), [3.979645447136021, 1.976454920954754]);
+    assert_eq!(theta0.collect(), [3.979645447136021, 1.976454920954754]);
     assert_eq!(
         theta1.to_scalar().real_part().into_inner(),
         6.169579045974949
@@ -366,7 +355,7 @@ mod tests {
         let theta0 = theta0.attach_rank::<1>().expect("rank 1 tensor");
         let theta1 = theta1.attach_rank::<0>().expect("rank 0 tensor");
-        assert_eq!(collect_vec(theta0), [3.97757644609063, 2.0496557321494446]);
+        assert_eq!(theta0.collect(), [3.97757644609063, 2.0496557321494446]);
         assert_eq!(
             theta1.to_scalar().real_part().into_inner(),
             5.786758464448078
@@ -404,7 +393,7 @@ mod tests {
         let [theta0, theta1] = iterated;
-        let theta0 = collect_vec(theta0.attach_rank::<1>().expect("rank 1 tensor"));
+        let theta0 = theta0.attach_rank::<1>().expect("rank 1 tensor").collect();
         let theta1 = theta1
             .attach_rank::<0>()
             .expect("rank 0 tensor")
@@ -472,7 +461,7 @@ mod tests {
         let theta0 = theta0.attach_rank::<1>().expect("rank 1 tensor");
         let theta1 = theta1.attach_rank::<0>().expect("rank 0 tensor");
-        assert_eq!(collect_vec(theta0), [3.979645447136021, 1.976454920954754]);
+        assert_eq!(theta0.collect(), [3.979645447136021, 1.976454920954754]);
        assert_eq!(
             theta1.to_scalar().real_part().into_inner(),
             6.169579045974949