internal: fix flakiness of accidentally quadratic test

author: Aleksey Kladov <[email protected]> 2021-04-13 10:49:10 +0100
committer: Aleksey Kladov <[email protected]> 2021-04-13 10:56:24 +0100
commit: 327323ad25d126f6394f26e1442667647022c383 (patch)
tree: 52612ccaa72c77f05997fda81af51e956d94a78d /crates/test_utils
parent: 6081b437cc842f8885c26636bef8af4cbc5483e3 (diff)
2 files changed, 114 insertions, 1 deletions
diff --git a/crates/test_utils/src/assert_linear.rs b/crates/test_utils/src/assert_linear.rs
new file mode 100644
index 000000000..6ecc232e1
--- /dev/null
+++ b/crates/test_utils/src/assert_linear.rs
@@ -0,0 +1,112 @@
+//! Checks that a set of measurements looks like a linear function rather than
+//! like a quadratic function. Algorithm:
+//!
+//! 1. Linearly scale each axis by dividing by its maximum, so that the largest value becomes 1
+//! 2. Using linear regression, compute the best linear function approximating
+//!    the input.
+//! 3. Compute RMSE and maximal absolute error.
+//! 4. Check that errors are within tolerances and that the constant term is not
+//!    too negative.
+//!
+//! Ideally, we should use a proper "model selection" to directly compare
+//! quadratic and linear models, but that sounds rather complicated:
+//!
+//!     https://stats.stackexchange.com/questions/21844/selecting-best-model-based-on-linear-quadratic-and-cubic-fit-of-data
+//!
+//! We might get false positives on a VM, but never false negatives. So, if the
+//! first round fails, we repeat the ordeal three more times and fail only if
+//! every time there's a fault.
+use stdx::format_to;
+/// Collects `(x, y)` samples over one or more rounds. When the value is
+/// dropped, it panics unless at least one round was judged linear.
+#[derive(Default)]
+pub struct AssertLinear {
+    /// Rounds started so far; `sample` appends to the last one.
+    rounds: Vec<Round>,
+}
+/// One batch of samples together with the verdict computed by `finish`.
+#[derive(Default)]
+struct Round {
+    /// Raw `(x, y)` measurements in the order they were recorded.
+    samples: Vec<(f64, f64)>,
+    /// Human-readable report of the fit; printed to stderr when the
+    /// assertion fails.
+    plot: String,
+    /// Whether the fit passed the tolerances; stays `false` until `finish`
+    /// has run.
+    linear: bool,
+}
+impl AssertLinear {
+    /// Upper bound on the number of rounds: the first attempt plus three
+    /// retries.
+    const MAX_ROUNDS: usize = 4;
+    /// Finishes the current round (if any) and reports whether another round
+    /// of sampling should be performed.
+    ///
+    /// Returns `false` once some round looked linear or `MAX_ROUNDS` rounds
+    /// have been recorded; otherwise starts a fresh round and returns `true`.
+    pub fn next_round(&mut self) -> bool {
+        if let Some(round) = self.rounds.last_mut() {
+            round.finish();
+        }
+        let succeeded = self.rounds.iter().any(|it| it.linear);
+        let exhausted = self.rounds.len() >= Self::MAX_ROUNDS;
+        if succeeded || exhausted {
+            return false;
+        }
+        self.rounds.push(Round::default());
+        true
+    }
+    /// Records one `(x, y)` measurement in the current round.
+    ///
+    /// # Panics
+    ///
+    /// Panics if no round has been started yet, i.e. `next_round` has not
+    /// been called.
+    pub fn sample(&mut self, x: f64, y: f64) {
+        self.rounds
+            .last_mut()
+            .expect("`AssertLinear::sample` called before `next_round` started a round")
+            .samples
+            .push((x, y))
+    }
+}
+impl Drop for AssertLinear {
+    /// Fails the test if no recorded round looked linear, printing every
+    /// round's report to stderr first.
+    fn drop(&mut self) {
+        // If the thread is already unwinding (for example the measured code
+        // panicked), a second panic from inside `drop` would abort the
+        // process and hide the original failure, so stay silent.
+        if std::thread::panicking() {
+            return;
+        }
+        assert!(!self.rounds.is_empty());
+        if self.rounds.iter().all(|it| !it.linear) {
+            for round in &self.rounds {
+                eprintln!("\n{}", round.plot);
+            }
+            panic!("Doesn't look linear!")
+        }
+    }
+}
+impl Round {
+    /// Fits `y = a + b*x` to this round's samples by least squares, then
+    /// stores the verdict in `self.linear` and a printable report in
+    /// `self.plot`.
+    ///
+    /// Each axis is first divided by its maximum, so the tolerances below are
+    /// relative to the largest observed value rather than absolute.
+    ///
+    /// # Panics
+    ///
+    /// Panics if the round has no samples, or if a NaN sample makes the
+    /// comparison inside `normalize` fail.
+    fn finish(&mut self) {
+        // Scales `xs` in place so that its largest element becomes 1.
+        fn normalize(xs: &mut [f64]) {
+            let max = xs
+                .iter()
+                .copied()
+                .max_by(|a, b| a.partial_cmp(b).expect("samples must be comparable (not NaN)"))
+                .expect("a round must contain at least one sample");
+            xs.iter_mut().for_each(|it| *it /= max);
+        }
+        // Arithmetic mean of `xs`.
+        fn mean(xs: &[f64]) -> f64 {
+            xs.iter().copied().sum::<f64>() / (xs.len() as f64)
+        }
+        let (mut xs, mut ys): (Vec<_>, Vec<_>) = self.samples.iter().copied().unzip();
+        normalize(&mut xs);
+        normalize(&mut ys);
+        let xy = xs.iter().copied().zip(ys.iter().copied());
+        // Linear regression: finding a and b to fit y = a + b*x.
+        let mean_x = mean(&xs);
+        let mean_y = mean(&ys);
+        let b = {
+            // Slope = covariance(x, y) / variance(x); the common 1/n factor
+            // cancels, so plain sums are enough.
+            let mut num = 0.0;
+            let mut denom = 0.0;
+            for (x, y) in xy.clone() {
+                num += (x - mean_x) * (y - mean_y);
+                denom += (x - mean_x).powi(2);
+            }
+            num / denom
+        };
+        // The least-squares line always passes through (mean_x, mean_y).
+        let a = mean_y - b * mean_x;
+        self.plot = format!("y_pred = {:.3} + {:.3} * x\n\nx     y     y_pred\n", a, b);
+        // Accumulate the squared error and track the worst single residual
+        // while emitting one report row per sample.
+        let mut se = 0.0;
+        let mut max_error = 0.0f64;
+        for (x, y) in xy {
+            let y_pred = a + b * x;
+            se += (y - y_pred).powi(2);
+            max_error = max_error.max((y_pred - y).abs());
+            format_to!(self.plot, "{:.3} {:.3} {:.3}\n", x, y, y_pred);
+        }
+        let rmse = (se / xs.len() as f64).sqrt();
+        format_to!(self.plot, "\nrmse = {:.3} max error = {:.3}", rmse, max_error);
+        // Accept only if the residuals are small and the intercept is not
+        // too negative. If any quantity is NaN (e.g. a zero maximum or a
+        // single sample) every comparison is false and the round is rejected.
+        self.linear = rmse < 0.05 && max_error < 0.1 && a > -0.1;
+    }
+}
diff --git a/crates/test_utils/src/lib.rs b/crates/test_utils/src/lib.rs
index c5f859790..72466c957 100644
--- a/crates/test_utils/src/lib.rs
+++ b/crates/test_utils/src/lib.rs
@@ -8,6 +8,7 @@
 pub mod bench_fixture;
 mod fixture;
+mod assert_linear;
 use std::{
    convert::{TryFrom, TryInto},
@@ -22,7 +23,7 @@ use text_size::{TextRange, TextSize};
 pub use dissimilar::diff as __diff;
 pub use rustc_hash::FxHashMap;
-pub use crate::fixture::Fixture;
+pub use crate::{assert_linear::AssertLinear, fixture::Fixture};
 pub const CURSOR_MARKER: &str = "$0";
 pub const ESCAPED_CURSOR_MARKER: &str = "\\$0";
author	Aleksey Kladov <[email protected]>	2021-04-13 10:49:10 +0100
committer	Aleksey Kladov <[email protected]>	2021-04-13 10:56:24 +0100
commit	327323ad25d126f6394f26e1442667647022c383 (patch)
tree	52612ccaa72c77f05997fda81af51e956d94a78d /crates/test_utils
parent	6081b437cc842f8885c26636bef8af4cbc5483e3 (diff)

diff --git a/crates/test_utils/src/assert_linear.rs b/crates/test_utils/src/assert_linear.rs new file mode 100644 index 000000000..6ecc232e1 --- /dev/null +++ b/crates/test_utils/src/assert_linear.rs
@@ -0,0 +1,112 @@
		1	//! Checks that a set of measurements looks like a linear function rather than
		2	//! like a quadratic function. Algorithm:
		3	//!
		4	//! 1. Linearly scale each axis by dividing by its maximum, so that the largest value becomes 1
		5	//! 2. Using linear regression, compute the best linear function approximating
		6	//! the input.
		7	//! 3. Compute RMSE and maximal absolute error.
		8	//! 4. Check that errors are within tolerances and that the constant term is not
		9	//! too negative.
		10	//!
		11	//! Ideally, we should use a proper "model selection" to directly compare
		12	//! quadratic and linear models, but that sounds rather complicated:
		13	//!
		14	//! https://stats.stackexchange.com/questions/21844/selecting-best-model-based-on-linear-quadratic-and-cubic-fit-of-data
		15	//!
		16	//! We might get false positives on a VM, but never false negatives. So, if the
		17	//! first round fails, we repeat the ordeal three more times and fail only if
		18	//! every time there's a fault.
		19	use stdx::format_to;
		20
		21	#[derive(Default)]
		22	pub struct AssertLinear {
		23	rounds: Vec<Round>,
		24	}
		25
		26	#[derive(Default)]
		27	struct Round {
		28	samples: Vec<(f64, f64)>,
		29	plot: String,
		30	linear: bool,
		31	}
		32
		33	impl AssertLinear {
		34	pub fn next_round(&mut self) -> bool {
		35	if let Some(round) = self.rounds.last_mut() {
		36	round.finish();
		37	}
		38	if self.rounds.iter().any(|it| it.linear) || self.rounds.len() == 4 {
		39	return false;
		40	}
		41	self.rounds.push(Round::default());
		42	true
		43	}
		44
		45	pub fn sample(&mut self, x: f64, y: f64) {
		46	self.rounds.last_mut().unwrap().samples.push((x, y))
		47	}
		48	}
		49
		50	impl Drop for AssertLinear {
		51	fn drop(&mut self) {
		52	assert!(!self.rounds.is_empty());
		53	if self.rounds.iter().all(|it| !it.linear) {
		54	for round in &self.rounds {
		55	eprintln!("\n{}", round.plot);
		56	}
		57	panic!("Doesn't look linear!")
		58	}
		59	}
		60	}
		61
		62	impl Round {
		63	fn finish(&mut self) {
		64	let (mut xs, mut ys): (Vec<_>, Vec<_>) = self.samples.iter().copied().unzip();
		65	normalize(&mut xs);
		66	normalize(&mut ys);
		67	let xy = xs.iter().copied().zip(ys.iter().copied());
		68
		69	// Linear regression: finding a and b to fit y = a + b*x.
		70
		71	let mean_x = mean(&xs);
		72	let mean_y = mean(&ys);
		73
		74	let b = {
		75	let mut num = 0.0;
		76	let mut denom = 0.0;
		77	for (x, y) in xy.clone() {
		78	num += (x - mean_x) * (y - mean_y);
		79	denom += (x - mean_x).powi(2);
		80	}
		81	num / denom
		82	};
		83
		84	let a = mean_y - b * mean_x;
		85
		86	self.plot = format!("y_pred = {:.3} + {:.3} * x\n\nx y y_pred\n", a, b);
		87
		88	let mut se = 0.0;
		89	let mut max_error = 0.0f64;
		90	for (x, y) in xy {
		91	let y_pred = a + b * x;
		92	se += (y - y_pred).powi(2);
		93	max_error = max_error.max((y_pred - y).abs());
		94
		95	format_to!(self.plot, "{:.3} {:.3} {:.3}\n", x, y, y_pred);
		96	}
		97
		98	let rmse = (se / xs.len() as f64).sqrt();
		99	format_to!(self.plot, "\nrmse = {:.3} max error = {:.3}", rmse, max_error);
		100
		101	self.linear = rmse < 0.05 && max_error < 0.1 && a > -0.1;
		102
		103	fn normalize(xs: &mut Vec<f64>) {
		104	let max = xs.iter().copied().max_by(|a, b| a.partial_cmp(b).unwrap()).unwrap();
		105	xs.iter_mut().for_each(|it| *it /= max);
		106	}
		107
		108	fn mean(xs: &[f64]) -> f64 {
		109	xs.iter().copied().sum::<f64>() / (xs.len() as f64)
		110	}
		111	}
		112	}


diff --git a/crates/test_utils/src/lib.rs b/crates/test_utils/src/lib.rs index c5f859790..72466c957 100644 --- a/crates/test_utils/src/lib.rs +++ b/crates/test_utils/src/lib.rs
@@ -8,6 +8,7 @@
8		8
9	pub mod bench_fixture;	9	pub mod bench_fixture;
10	mod fixture;	10	mod fixture;
		11	mod assert_linear;
11		12
12	use std::{	13	use std::{
13	convert::{TryFrom, TryInto},	14	convert::{TryFrom, TryInto},
@@ -22,7 +23,7 @@ use text_size::{TextRange, TextSize};
22	pub use dissimilar::diff as __diff;	23	pub use dissimilar::diff as __diff;
23	pub use rustc_hash::FxHashMap;	24	pub use rustc_hash::FxHashMap;
24		25
25	pub use crate::fixture::Fixture;	26	pub use crate::{assert_linear::AssertLinear, fixture::Fixture};
26		27
27	pub const CURSOR_MARKER: &str = "$0";	28	pub const CURSOR_MARKER: &str = "$0";
28	pub const ESCAPED_CURSOR_MARKER: &str = "\\$0";	29	pub const ESCAPED_CURSOR_MARKER: &str = "\\$0";