From aafe360e40349031befe3c626fc8bb359dba5545 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Juli=C3=A1n=20D=2E=20Ot=C3=A1lvaro?=
 <juliandavid347@gmail.com>
Date: Fri, 17 Oct 2025 12:35:30 -0400
Subject: [PATCH 1/3] add the checkbig convergence criteria

---
 src/algorithms/npag.rs | 76 ++++++++++++++++++++++++++++++++++++++++--
 1 file changed, 74 insertions(+), 2 deletions(-)
diff --git a/src/algorithms/npag.rs b/src/algorithms/npag.rs
index 332eef50e..77e3ba059 100644
--- a/src/algorithms/npag.rs
+++ b/src/algorithms/npag.rs
@@ -28,12 +28,54 @@ const THETA_G: f64 = 1e-4; // Objective function convergence criteria
 const THETA_F: f64 = 1e-2;
 const THETA_D: f64 = 1e-4;
 
+/// Calculate CHECKBIG convergence metric as in Fortran NPAGFULLA
+/// 
+/// Returns the median of relative parameter changes across all support points.
+/// This is calculated as: median(abs((theta_new - theta_old) / theta_old))
+/// 
+/// Used by Fortran as an alternative convergence criterion focusing on parameter stability
+/// rather than objective function improvement.
+fn calculate_checkbig(theta_old: &Theta, theta_new: &Theta) -> f64 {
+    let mut changes = Vec::new();
+    let old_mat = theta_old.matrix();
+    let new_mat = theta_new.matrix();
+    
+    // Calculate relative change for each parameter in each support point
+    for row in 0..old_mat.nrows() {
+        for col in 0..old_mat.ncols() {
+            let old_val = old_mat.get(row, col);
+            let new_val = new_mat.get(row, col);
+            
+            // Avoid division by zero for very small values
+            if old_val.abs() > 1e-10 {
+                let rel_change = ((new_val - old_val) / old_val).abs();
+                changes.push(rel_change);
+            }
+        }
+    }
+    
+    if changes.is_empty() {
+        return 0.0;
+    }
+    
+    // Calculate median
+    changes.sort_by(|a, b| a.partial_cmp(b).unwrap());
+    let mid = changes.len() / 2;
+    
+    if changes.len() % 2 == 0 {
+        (changes[mid - 1] + changes[mid]) / 2.0
+    } else {
+        changes[mid]
+    }
+}
+
 #[derive(Debug)]
 pub struct NPAG<E: Equation> {
     equation: E,
     ranges: Vec<(f64, f64)>,
     psi: Psi,
     theta: Theta,
+    theta_old: Option<Theta>,  // Store previous theta for CHECKBIG calculation
     lambda: Weights,
     w: Weights,
     eps: f64,
@@ -58,6 +100,7 @@ impl<E: Equation> Algorithms<E> for NPAG<E> {
             ranges: settings.parameters().ranges(),
             psi: Psi::new(),
             theta: Theta::new(),
+            theta_old: None,  // Initialize as None (no previous theta yet)
             lambda: Weights::default(),
             w: Weights::default(),
             eps: 0.2,
@@ -139,8 +182,34 @@ impl<E: Equation> Algorithms<E> for NPAG<E> {
             if self.eps <= THETA_E {
                 let pyl = psi * w.weights();
                 self.f1 = pyl.iter().map(|x| x.ln()).sum();
-                if (self.f1 - self.f0).abs() <= THETA_F {
-                    tracing::info!("The model converged after {} cycles", self.cycle,);
+                
+                // Calculate CHECKBIG if we have a previous theta
+                let checkbig = if let Some(ref old_theta) = self.theta_old {
+                    calculate_checkbig(old_theta, &self.theta)
+                } else {
+                    f64::MAX  // First cycle, no previous theta
+                };
+                
+                let f1_f0_diff = (self.f1 - self.f0).abs();
+                
+                // Log both convergence metrics for diagnostics
+                tracing::info!(
+                    "Cycle {}: f1-f0={:.6e} (threshold={:.6e}), CHECKBIG={:.6e} (threshold={:.6e})",
+                    self.cycle,
+                    f1_f0_diff,
+                    THETA_F,
+                    checkbig,
+                    THETA_E
+                );
+                
+                // Use f1-f0 as convergence criterion (standard approach)
+                if f1_f0_diff <= THETA_F {
+                    tracing::info!(
+                        "The model converged after {} cycles (f1-f0={:.6e} < THETA_F={:.6e})",
+                        self.cycle,
+                        f1_f0_diff,
+                        THETA_F
+                    );
                     self.converged = true;
                     self.status = Status::Converged;
                 } else {
@@ -149,6 +218,9 @@ impl<E: Equation> Algorithms<E> for NPAG<E> {
                 }
             }
         }
+        
+        // Save current theta for next cycle's CHECKBIG calculation
+        self.theta_old = Some(self.theta.clone());
 
         // Stop if we have reached maximum number of cycles
         if self.cycle >= self.settings.config().cycles {

From 7f8c5f3fbac6e205a5eae1fca0160c04db60aa14 Mon Sep 17 00:00:00 2001
From: Markus <66058642+mhovd@users.noreply.github.com>
Date: Thu, 23 Oct 2025 10:41:48 +0200
Subject: [PATCH 2/3] Cargo fmt

---
 src/algorithms/npag.rs | 30 +++++++++++++++---------------
 1 file changed, 15 insertions(+), 15 deletions(-)

diff --git a/src/algorithms/npag.rs b/src/algorithms/npag.rs
index 77e3ba059..3deac9707 100644
--- a/src/algorithms/npag.rs
+++ b/src/algorithms/npag.rs
@@ -29,23 +29,23 @@ const THETA_F: f64 = 1e-2;
 const THETA_D: f64 = 1e-4;
 
 /// Calculate CHECKBIG convergence metric as in Fortran NPAGFULLA
-/// 
+///
 /// Returns the median of relative parameter changes across all support points.
 /// This is calculated as: median(abs((theta_new - theta_old) / theta_old))
-/// 
+///
 /// Used by Fortran as an alternative convergence criterion focusing on parameter stability
 /// rather than objective function improvement.
 fn calculate_checkbig(theta_old: &Theta, theta_new: &Theta) -> f64 {
     let mut changes = Vec::new();
     let old_mat = theta_old.matrix();
     let new_mat = theta_new.matrix();
-    
+
     // Calculate relative change for each parameter in each support point
     for row in 0..old_mat.nrows() {
         for col in 0..old_mat.ncols() {
             let old_val = old_mat.get(row, col);
             let new_val = new_mat.get(row, col);
-            
+
             // Avoid division by zero for very small values
             if old_val.abs() > 1e-10 {
                 let rel_change = ((new_val - old_val) / old_val).abs();
@@ -53,15 +53,15 @@ fn calculate_checkbig(theta_old: &Theta, theta_new: &Theta) -> f64 {
             }
         }
     }
-    
+
     if changes.is_empty() {
         return 0.0;
     }
-    
+
     // Calculate median
     changes.sort_by(|a, b| a.partial_cmp(b).unwrap());
     let mid = changes.len() / 2;
-    
+
     if changes.len() % 2 == 0 {
         (changes[mid - 1] + changes[mid]) / 2.0
     } else {
@@ -75,7 +75,7 @@ pub struct NPAG<E: Equation> {
     ranges: Vec<(f64, f64)>,
     psi: Psi,
     theta: Theta,
-    theta_old: Option<Theta>,  // Store previous theta for CHECKBIG calculation
+    theta_old: Option<Theta>, // Store previous theta for CHECKBIG calculation
     lambda: Weights,
     w: Weights,
     eps: f64,
@@ -100,7 +100,7 @@ impl<E: Equation> Algorithms<E> for NPAG<E> {
             ranges: settings.parameters().ranges(),
             psi: Psi::new(),
             theta: Theta::new(),
-            theta_old: None,  // Initialize as None (no previous theta yet)
+            theta_old: None, // Initialize as None (no previous theta yet)
             lambda: Weights::default(),
             w: Weights::default(),
             eps: 0.2,
@@ -182,16 +182,16 @@ impl<E: Equation> Algorithms<E> for NPAG<E> {
             if self.eps <= THETA_E {
                 let pyl = psi * w.weights();
                 self.f1 = pyl.iter().map(|x| x.ln()).sum();
-                
+
                 // Calculate CHECKBIG if we have a previous theta
                 let checkbig = if let Some(ref old_theta) = self.theta_old {
                     calculate_checkbig(old_theta, &self.theta)
                 } else {
-                    f64::MAX  // First cycle, no previous theta
+                    f64::MAX // First cycle, no previous theta
                 };
-                
+
                 let f1_f0_diff = (self.f1 - self.f0).abs();
-                
+
                 // Log both convergence metrics for diagnostics
                 tracing::info!(
                     "Cycle {}: f1-f0={:.6e} (threshold={:.6e}), CHECKBIG={:.6e} (threshold={:.6e})",
@@ -201,7 +201,7 @@ impl<E: Equation> Algorithms<E> for NPAG<E> {
                     checkbig,
                     THETA_E
                 );
-                
+
                 // Use f1-f0 as convergence criterion (standard approach)
                 if f1_f0_diff <= THETA_F {
                     tracing::info!(
@@ -218,7 +218,7 @@ impl<E: Equation> Algorithms<E> for NPAG<E> {
                 }
             }
         }
-        
+
         // Save current theta for next cycle's CHECKBIG calculation
         self.theta_old = Some(self.theta.clone());
 

From 106d10dec8c22d3c6fa9c0928b8f071472e86ad6 Mon Sep 17 00:00:00 2001
From: Markus <markushh@uio.no>
Date: Fri, 7 Nov 2025 22:26:47 +0100
Subject: [PATCH 3/3] Update CHECKBIG calculation and convergence

---
 src/algorithms/npag.rs | 86 +++++++++++++----------------------------
 src/structs/theta.rs   | 88 +++++++++++++++++++++++++++++++++++++++++-
 src/structs/weights.rs | 11 ++++++
 3 files changed, 125 insertions(+), 60 deletions(-)

diff --git a/src/algorithms/npag.rs b/src/algorithms/npag.rs
index 4ddf15e13..2e54720d9 100644
--- a/src/algorithms/npag.rs
+++ b/src/algorithms/npag.rs
@@ -28,47 +28,6 @@ const THETA_G: f64 = 1e-4; // Objective function convergence criteria
 const THETA_F: f64 = 1e-2;
 const THETA_D: f64 = 1e-4;
 
-/// Calculate CHECKBIG convergence metric as in Fortran NPAGFULLA
-///
-/// Returns the median of relative parameter changes across all support points.
-/// This is calculated as: median(abs((theta_new - theta_old) / theta_old))
-///
-/// Used by Fortran as an alternative convergence criterion focusing on parameter stability
-/// rather than objective function improvement.
-fn calculate_checkbig(theta_old: &Theta, theta_new: &Theta) -> f64 {
-    let mut changes = Vec::new();
-    let old_mat = theta_old.matrix();
-    let new_mat = theta_new.matrix();
-
-    // Calculate relative change for each parameter in each support point
-    for row in 0..old_mat.nrows() {
-        for col in 0..old_mat.ncols() {
-            let old_val = old_mat.get(row, col);
-            let new_val = new_mat.get(row, col);
-
-            // Avoid division by zero for very small values
-            if old_val.abs() > 1e-10 {
-                let rel_change = ((new_val - old_val) / old_val).abs();
-                changes.push(rel_change);
-            }
-        }
-    }
-
-    if changes.is_empty() {
-        return 0.0;
-    }
-
-    // Calculate median
-    changes.sort_by(|a, b| a.partial_cmp(b).unwrap());
-    let mid = changes.len() / 2;
-
-    if changes.len() % 2 == 0 {
-        (changes[mid - 1] + changes[mid]) / 2.0
-    } else {
-        changes[mid]
-    }
-}
-
 #[derive(Debug)]
 pub struct NPAG<E: Equation + Send + 'static> {
     equation: E,
@@ -208,34 +167,43 @@ impl<E: Equation + Send + 'static> Algorithms<E> for NPAG<E> {
 
                 // Calculate CHECKBIG if we have a previous theta
                 let checkbig = if let Some(ref old_theta) = self.theta_old {
-                    calculate_checkbig(old_theta, &self.theta)
+                    Some(self.theta.max_relative_difference(old_theta)?)
                 } else {
-                    f64::MAX // First cycle, no previous theta
+                    None
                 };
 
                 let f1_f0_diff = (self.f1 - self.f0).abs();
 
-                // Log both convergence metrics for diagnostics
-                tracing::info!(
-                    "Cycle {}: f1-f0={:.6e} (threshold={:.6e}), CHECKBIG={:.6e} (threshold={:.6e})",
-                    self.cycle,
-                    f1_f0_diff,
-                    THETA_F,
-                    checkbig,
-                    THETA_E
-                );
-
-                // Use f1-f0 as convergence criterion (standard approach)
-                if f1_f0_diff <= THETA_F {
-                    tracing::info!(
-                        "The model converged after {} cycles (f1-f0={:.6e} < THETA_F={:.6e})",
-                        self.cycle,
+                // Log convergence metrics for diagnostics
+                match checkbig {
+                    Some(cb) => tracing::debug!(
+                        "f1-f0={:.6e} (threshold={:.6e}), CHECKBIG={:.6e} (threshold={:.6e})",
+                        f1_f0_diff,
+                        THETA_F,
+                        cb,
+                        THETA_E
+                    ),
+                    None => tracing::debug!(
+                        "f1-f0={:.6e} (threshold={:.6e}), CHECKBIG=N/A (no previous theta)",
                         f1_f0_diff,
                         THETA_F
-                    );
+                    ),
+                }
+
+                // Standard likelihood convergence check
+                if f1_f0_diff <= THETA_F {
+                    tracing::info!("The model converged according to the LIKELIHOOD criteria",);
                     self.set_status(Status::Stop(StopReason::Converged));
                     self.log_cycle_state();
                     return Ok(self.status().clone());
+                } else if matches!(checkbig, Some(cb) if cb <= THETA_E) {
+                    // Additional CHECKBIG convergence check. Keep this a single condition:
+                    // a missing or above-threshold CHECKBIG value must fall through to the
+                    // final `else`, which updates `f0` and resets `eps`.
+                    tracing::info!("The model converged according to the CHECKBIG criteria",);
+                    self.set_status(Status::Stop(StopReason::Converged));
+                    self.log_cycle_state();
+                    return Ok(self.status().clone());
                 } else {
                     self.f0 = self.f1;
                     self.eps = 0.2;
diff --git a/src/structs/theta.rs b/src/structs/theta.rs
index b03a873b6..88d59e674 100644
--- a/src/structs/theta.rs
+++ b/src/structs/theta.rs
@@ -1,7 +1,7 @@
 use std::fmt::Debug;
 
 use anyhow::{bail, Result};
-use faer::Mat;
+use faer::{ColRef, Mat};
 use serde::{Deserialize, Serialize};
 
 use crate::prelude::Parameters;
@@ -201,6 +201,41 @@ impl Theta {
 
         Theta::from_parts(mat, parameters)
     }
+
+    /// Compute the maximum relative difference in medians across parameters between two Thetas
+    ///
+    /// This is useful for assessing convergence between iterations
+    /// # Errors
+    /// Returns an error if the column counts differ, a Theta has no rows, or a median is not finite
+    pub fn max_relative_difference(&self, other: &Theta) -> Result<f64> {
+        if self.matrix.ncols() != other.matrix.ncols() {
+            bail!("Number of parameters (columns) do not match between Thetas");
+        }
+        if self.matrix.nrows() == 0 || other.matrix.nrows() == 0 {
+            bail!("Cannot compute parameter medians for a Theta without support points");
+        }
+
+        // Median of one parameter column; the column has at least one row (checked above)
+        fn median_col(col: ColRef<f64>) -> f64 {
+            let mut vals: Vec<f64> = col.iter().copied().collect();
+            vals.sort_unstable_by(f64::total_cmp); // total order, so NaN cannot panic the sort
+            // Mean of the two central elements; both indices coincide for odd lengths
+            (vals[(vals.len() - 1) / 2] + vals[vals.len() / 2]) / 2.0
+        }
+
+        let mut max_rel_diff: f64 = 0.0;
+        for i in 0..self.matrix.ncols() {
+            let current_median = median_col(self.matrix.col(i));
+            let other_median = median_col(other.matrix.col(i));
+            let denom = current_median.abs().max(other_median.abs()).max(1e-8); // Avoid division by zero
+            let rel_diff = (current_median - other_median).abs() / denom;
+            if rel_diff.is_nan() {
+                bail!("Parameter medians must be finite to compare Thetas");
+            }
+            max_rel_diff = max_rel_diff.max(rel_diff);
+        }
+        Ok(max_rel_diff)
+    }
 }
 
 impl Debug for Theta {
@@ -379,4 +414,55 @@ mod tests {
 
         assert_eq!(theta.matrix(), &new_matrix);
     }
+
+    #[test]
+    fn test_max_relative_difference() {
+        let matrix1 = mat![[2.0, 4.0], [6.0, 8.0]];
+        let matrix2 = mat![[2.0, 4.0], [8.0, 8.0]];
+        let parameters = Parameters::new().add("A", 0.0, 10.0).add("B", 0.0, 10.0);
+        let theta1 = Theta::from_parts(matrix1, parameters.clone()).unwrap();
+        let theta2 = Theta::from_parts(matrix2, parameters).unwrap();
+        let max_rel_diff = theta1.max_relative_difference(&theta2).unwrap();
+        // Column medians: A = 4 vs 5 (|4 - 5| / 5 = 0.2), B = 6 vs 6 (0.0)
+        assert!((max_rel_diff - 0.2).abs() < 1e-6, "got {}", max_rel_diff);
+    }
+
+    #[test]
+    fn test_max_relative_difference_same_theta() {
+        let matrix1 = mat![[1.0, 2.0], [3.0, 4.0]];
+        let parameters = Parameters::new().add("A", 0.0, 10.0).add("B", 0.0, 10.0);
+        let theta1 = Theta::from_parts(matrix1, parameters).unwrap();
+        let theta2 = theta1.clone();
+        let max_rel_diff = theta1.max_relative_difference(&theta2).unwrap();
+        // Identical Thetas have identical column medians, so every relative difference is zero
+        assert!(max_rel_diff.abs() < 1e-6, "got {}", max_rel_diff);
+    }
+
+    #[test]
+    fn test_max_relative_difference_shape_error() {
+        // Three parameters (columns) on one side, two on the other: the comparison must fail
+        let three_params = Parameters::new()
+            .add("A", 0.0, 10.0)
+            .add("B", 0.0, 10.0)
+            .add("C", 0.0, 10.0);
+        let two_params = Parameters::new().add("A", 0.0, 10.0).add("B", 0.0, 10.0);
+        let wide = mat![[2.0, 4.0, 6.0], [8.0, 10.0, 12.0]];
+        let narrow = mat![[2.0, 4.0], [8.0, 8.0]];
+        let theta_wide = Theta::from_parts(wide, three_params).unwrap();
+        let theta_narrow = Theta::from_parts(narrow, two_params).unwrap();
+        assert!(theta_wide.max_relative_difference(&theta_narrow).is_err());
+    }
+
+    #[test]
+    fn test_max_relative_difference_odd_length() {
+        let matrix1 = mat![[1.0, 2.0], [3.0, 6.0], [5.0, 10.0]];
+        let matrix2 = mat![[1.0, 2.0], [4.0, 6.0], [5.0, 10.0]];
+        let parameters = Parameters::new().add("A", 0.0, 10.0).add("B", 0.0, 10.0);
+        let theta1 = Theta::from_parts(matrix1, parameters.clone()).unwrap();
+        let theta2 = Theta::from_parts(matrix2, parameters).unwrap();
+        let max_rel_diff = theta1.max_relative_difference(&theta2).unwrap();
+        // With three rows the median is the middle value:
+        // A = 3 vs 4 (|3 - 4| / 4 = 0.25), B = 6 vs 6 (0.0)
+        assert!((max_rel_diff - 0.25).abs() < 1e-6, "got {}", max_rel_diff);
+    }
 }
diff --git a/src/structs/weights.rs b/src/structs/weights.rs
index e84974443..1f515a94c 100644
--- a/src/structs/weights.rs
+++ b/src/structs/weights.rs
@@ -58,14 +58,25 @@ impl Weights {
         self.weights.nrows()
     }
 
+    /// Returns `true` if there are no weights, i.e. the underlying storage has zero rows.
+    pub fn is_empty(&self) -> bool {
+        self.weights.nrows() == 0
+    }
+
     /// Get a vector representation of the weights.
     pub fn to_vec(&self) -> Vec<f64> {
         self.weights.iter().cloned().collect()
     }
 
+    /// Get an iterator over the weights, yielding each weight by value (`f64`).
     pub fn iter(&self) -> impl Iterator<Item = f64> + '_ {
         self.weights.iter().cloned()
     }
+
+    /// Get a mutable iterator over the weights, yielding `&mut f64` for in-place updates.
+    pub fn iter_mut(&mut self) -> impl Iterator<Item = &mut f64> + '_ {
+        self.weights.iter_mut()
+    }
 }
 
 impl Serialize for Weights {