Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion src/main.rs
Original file line number Diff line number Diff line change
Expand Up @@ -19,8 +19,8 @@ mod engine;
mod game;
mod openings;
mod pgn_writer;
mod simulation;
mod sprt;
mod stats;
#[cfg(test)]
mod tests;
mod tournament;
Expand Down
120 changes: 0 additions & 120 deletions src/simulation/mod.rs

This file was deleted.

202 changes: 151 additions & 51 deletions src/sprt.rs
Original file line number Diff line number Diff line change
@@ -1,16 +1,10 @@
use std::convert::TryInto;
use crate::stats::{PentanomialResult, ResultExt};
use std::{convert::TryInto, num::FpCategory};

// This is an implementation of GSPRT under a pentanomial model.

#[derive(Clone, Copy, Debug, PartialEq, Eq)]
pub struct PentanomialResult {
pub ww: usize,
pub wd: usize,
pub wl: usize,
pub dd: usize,
pub dl: usize,
pub ll: usize,
}
//
// References:
// [1] Michel Van den Bergh, Comments on Normalized Elo, https://www.cantate.be/Fishtest/normalized_elo_practical.pdf

#[derive(Clone, Copy, Debug, PartialEq)]
pub struct SprtParameters {
Expand Down Expand Up @@ -47,51 +41,157 @@ impl SprtParameters {
(self.elo0, self.elo1)
}

// Approximate formula for the log-likelihood ratio for the given pentanomial result.
// See section 4.2 of https://archive.org/details/fishtest_mathematics/normalized_elo_practical/
// Many thanks to Michel Van den Bergh.
pub fn llr(self: SprtParameters, penta: PentanomialResult) -> f64 {
let (n, mean, variance) = penta.to_mean_and_variance();
let sigma = (2.0 * variance).sqrt();
let t = (mean - 0.5) / sigma;
let a = 1.0 + (t - self.t0).powf(2.0);
let b = 1.0 + (t - self.t1).powf(2.0);
n * f64::ln(a / b)
let count = penta.count() as f64;
let pdf: [f64; 5] = penta.probability_distribution().try_into().unwrap();
let score: [f64; 5] = PentanomialResult::scores_map().try_into().unwrap();
llr(
count,
pdf,
score,
self.t0 * f64::sqrt(2.0),
self.t1 * f64::sqrt(2.0),
)
}
}

impl PentanomialResult {
pub fn to_pdf(self: PentanomialResult) -> (f64, [f64; 5]) {
let penta = [
self.ll as f64,
self.dl as f64,
self.dd as f64 + self.wl as f64,
self.wd as f64,
self.ww as f64,
];
let zeros = penta.iter().filter(|&x| *x == 0.0).count();
let regularisation = if zeros > 0 { 2.0 / zeros as f64 } else { 0.0 };
let n: f64 = penta.iter().sum();
(
n,
penta
.iter()
.map(|x| (x + regularisation) / n)
.collect::<Vec<_>>()
.try_into()
.unwrap(),
)
}
/// Log-likelihood ratio for the hypothesis t = t1 against t = t0,
/// given `count` observations drawn from the empirical distribution
/// `pdf` over the outcome values `score`.
fn llr<const N: usize>(count: f64, pdf: [f64; N], score: [f64; N], t0: f64, t1: f64) -> f64 {
    // Maximum-likelihood outcome distributions under each hypothesis.
    let p0 = mle(pdf, score, 0.5, t0);
    let p1 = mle(pdf, score, 0.5, t1);
    // Per-outcome log-likelihood differences, averaged under the
    // empirical distribution and scaled by the sample size.
    let log_diff: [f64; N] = std::array::from_fn(|i| p1[i].ln() - p0[i].ln());
    count * mean(log_diff, pdf)
}

/// Compute the maximum likelihood estimate for a discrete
/// probability distribution that has t = (mu - mu_ref) / sigma,
/// given `self` is an empirical distribution.
///
/// See section 4.1 of [1] for details.
fn mle<const N: usize>(pdf: [f64; N], score: [f64; N], mu_ref: f64, t_star: f64) -> [f64; N] {
const THETA_EPSILON: f64 = 1e-7;
const MLE_EPSILON: f64 = 1e-4;

// This is an iterative method, so we need to start with
// an initial value. As suggested in [1], we start with a
// uniform distribution.
let mut p = [1.0 / N as f64; N];

pub fn to_mean_and_variance(self: PentanomialResult) -> (f64, f64, f64) {
let scores = [0.0, 0.25, 0.5, 0.75, 1.0];
let (n, pdf) = self.to_pdf();
let mean: f64 = pdf.iter().zip(scores).map(|(p, s)| p * s).sum();
let variance: f64 = pdf
// Have an upper limit for iteration.
for _ in 0..25 {
// Store our current estimate away to detect convergence.
let prev_p = p;

// Calculate phi.
let (mu, variance) = mean_and_variance(score, p);
let phi: [f64; N] = std::array::from_fn(|i| {
let a_i = score[i];
let sigma = variance.sqrt();
a_i - mu_ref - 0.5 * t_star * sigma * (1.0 + ((a_i - mu) / sigma).powi(2))
});

// We need to find a subset of the possible solutions for theta,
// so we need to calculate our constraints for theta.
let u = phi
.iter()
.zip(scores)
.map(|(p, s)| p * (s - mean).powf(2.0))
.sum();
(n, mean, variance)
.min_by(|a, b| a.partial_cmp(b).expect("unexpected NaN"))
.unwrap();
let v = phi
.iter()
.max_by(|a, b| a.partial_cmp(b).expect("unexpected NaN"))
.unwrap();
let min_theta = -1.0 / v;
let max_theta = -1.0 / u;

// Solve equation 4.9 in [1] for theta.
let theta = itp(
|x: f64| (0..N).map(|i| pdf[i] * phi[i] / (1.0 + x * phi[i])).sum(),
(min_theta, max_theta),
(f64::INFINITY, -f64::INFINITY),
0.1,
2.0,
0.99,
THETA_EPSILON,
);

// Calculate new estimate
p = std::array::from_fn(|i| pdf[i] / (1.0 + theta * phi[i]));

// Good enough?
if (0..N).all(|i| (prev_p[i] - p[i]).abs() < MLE_EPSILON) {
break;
}
}

p
}

/// Expected value of `x` under the probability distribution `p`.
fn mean<const N: usize>(x: [f64; N], p: [f64; N]) -> f64 {
    x.iter()
        .zip(p.iter())
        .map(|(&x_i, &p_i)| p_i * x_i)
        .sum()
}

/// Returns `(mu, sigma^2)`: the mean and variance of `x` under the
/// probability distribution `p`.
fn mean_and_variance<const N: usize>(x: [f64; N], p: [f64; N]) -> (f64, f64) {
    let mu = mean(x, p);
    // E[(x - mu)^2], accumulated in index order.
    let variance: f64 = x
        .iter()
        .zip(p.iter())
        .map(|(&x_i, &p_i)| p_i * (x_i - mu).powi(2))
        .sum();
    (mu, variance)
}

// Scalar root finder using the ITP (interpolate, truncate, project) method.
//
// Expects a bracket `(a, b)` with function values `(f_a, f_b)` of opposite
// sign; infinite initial values are tolerated (the interpolation step then
// yields NaN and the iteration falls back to plain bisection until both
// endpoint values are finite).
//
// I. F. D. Oliveira and R. H. C. Takahashi. 2020. An Enhancement of the Bisection Method Average Performance
// Preserving Minmax Optimality. ACM Trans. Math. Softw. 47, 1, Article 5 (March 2021).
// https://doi.org/10.1145/3423597
fn itp<F>(
    f: F,
    (mut a, mut b): (f64, f64),
    (mut f_a, mut f_b): (f64, f64),
    k_1: f64,
    k_2: f64,
    n_0: f64,
    epsilon: f64,
) -> f64
where
    F: Fn(f64) -> f64,
{
    // Orient the bracket so that f(a) < 0 < f(b).
    if f_a > 0.0 {
        std::mem::swap(&mut a, &mut b);
        std::mem::swap(&mut f_a, &mut f_b);
    }
    assert!(f_a < 0.0 && 0.0 < f_b);

    // Worst-case iteration budget: the bisection count for this interval
    // and tolerance, plus the n_0 slack allowed by the method.
    let n_max = ((b - a).abs() / (2.0 * epsilon)).log2().ceil() + n_0;

    let mut iteration = 0;
    while (b - a).abs() > 2.0 * epsilon {
        let midpoint = (a + b) / 2.0;
        // Projection radius that preserves the minmax guarantee.
        let radius = epsilon * f64::powf(2.0, n_max - iteration as f64) - (b - a) / 2.0;
        // Truncation distance.
        let delta = k_1 * f64::powf(b - a, k_2);

        // Interpolate: regula-falsi (secant) estimate of the root.
        let secant = (f_b * a - f_a * b) / (f_b - f_a);

        // Truncate: pull the secant estimate towards the midpoint by delta.
        let direction = (midpoint - secant) / (midpoint - secant).abs();
        let truncated = if delta <= (midpoint - secant).abs() {
            secant + direction * delta
        } else {
            midpoint
        };

        // Project: clamp the candidate into the minmax-optimal radius
        // around the midpoint.
        let x_itp = if (truncated - midpoint).abs() <= radius {
            truncated
        } else {
            midpoint - direction * radius
        };

        // Shrink the bracket, keeping f(a) < 0 < f(b).
        let f_itp = f(x_itp);
        if f_itp.classify() == FpCategory::Zero {
            // Exact zero: collapse the bracket and terminate.
            a = x_itp;
            b = x_itp;
        } else if f_itp.is_sign_negative() {
            a = x_itp;
            f_a = f_itp;
        } else {
            b = x_itp;
            f_b = f_itp;
        }

        iteration += 1;
    }

    (a + b) / 2.0
}
Loading