fix: implement batch mode for ADMM solver with validation checks

lachlangrose · lachlangrose · commit 270fbe53df0d · 2026-02-25T14:51:15.000+11:00
diff --git a/loopsolver/admm_solver.py b/loopsolver/admm_solver.py
@@ -35,6 +35,9 @@ def admm_solve(
     nmajor=200,
     linsys_solver_kwargs={},
     linsys_solver="lsmr",
+    batch_size: int = None,
+    batch_fraction: float = None,
+    random_seed: int = None,
 ):
     if A.shape[1] != x0.shape[0]:
         raise ValueError("Number of columns in interpolation matrix does not match x0")
@@ -51,6 +54,31 @@ def admm_solve(
     if A.shape[0] != b.shape[0]:
         raise ValueError("Number of rows in interpolation matrix and b are different")
     n_ie = bounds.shape[0]
+    
+    # Setup batch mode
+    use_batch_mode = False
+    n_batch = n_ie
+    rng = None
+    
+    if batch_size is not None and batch_fraction is not None:
+        raise ValueError("Cannot specify both batch_size and batch_fraction")
+    
+    if batch_size is not None:
+        if batch_size < 1 or batch_size > n_ie:
+            raise ValueError(f"batch_size must be between 1 and {n_ie}")
+        n_batch = batch_size
+        use_batch_mode = True
+    elif batch_fraction is not None:
+        if batch_fraction <= 0 or batch_fraction > 1:
+            raise ValueError("batch_fraction must be between 0 and 1")
+        n_batch = max(1, int(n_ie * batch_fraction))
+        use_batch_mode = True
+    
+    if use_batch_mode and random_seed is not None:
+        rng = np.random.RandomState(random_seed)
+    elif use_batch_mode:
+        rng = np.random.RandomState()
+    
     qx_val = np.zeros((Q.shape[0], 1))
     model = np.zeros(A.shape[1])
     model[:] = x0[:]
@@ -71,38 +99,75 @@ def admm_solve(
         if not hasattr(linsys_solver_kwargs[k], '__len__') or len(linsys_solver_kwargs[k]) != nmajor:
             linsys_solver_kwargs[k] = [linsys_solver_kwargs[k]] * nmajor
     for _i in tqdm.tqdm(range(nmajor)):
+        # Sample batch of inequality constraints if batch mode is enabled
+        if use_batch_mode:
+            batch_idx = rng.choice(n_ie, size=n_batch, replace=False)
+            batch_idx = np.sort(batch_idx)  # Sort for consistent sparse matrix operations
+            Q_batch = Q[batch_idx, :]
+            xmin_batch = xmin[batch_idx, :]
+            xmax_batch = xmax[batch_idx, :]
+            matrix = vstack([A, Q_batch])
+            b = np.zeros(A.shape[0] + n_batch)
+            
+            # Build a temporary ADMM object sized for this iteration's batch only.
+            # Its z and u are copied from the full state here and written back after the update.
+            admm_batch = ADMM(n_batch)
+            admm_batch.z = admm_method.z[batch_idx].copy()
+            admm_batch.u = admm_method.u[batch_idx].copy()
+        else:
+            batch_idx = None
+            
         # current model value
         Mx = matrix @ model  # np.dot(A, model)
         b[:A_size] = b0[:A_size] - Mx[:A_size]
 
         if Q.shape[0] > 0:
-
-            qx_val[:, 0] = Mx[A_size:,] / admm_weight
-            x0_ADMM = admm_method.admm_method_iterate_admm_array(xmin, xmax, qx_val)
-            # print(x0_ADMM, qx_val.shape)
-            # raise Exception
-            b[A_size:] = -admm_weight * (qx_val[:, 0] - x0_ADMM)
+            if use_batch_mode:
+                qx_val_batch = np.zeros((n_batch, 1))
+                qx_val_batch[:, 0] = Mx[A_size:] / admm_weight
+                x0_ADMM_batch = admm_batch.admm_method_iterate_admm_array(xmin_batch, xmax_batch, qx_val_batch)
+                b[A_size:] = -admm_weight * (qx_val_batch[:, 0] - x0_ADMM_batch)
+                
+                # Update the main ADMM state with the batch results
+                admm_method.z[batch_idx] = admm_batch.z
+                admm_method.u[batch_idx] = admm_batch.u
+            else:
+                qx_val[:, 0] = Mx[A_size:,] / admm_weight
+                x0_ADMM = admm_method.admm_method_iterate_admm_array(xmin, xmax, qx_val)
+                # print(x0_ADMM, qx_val.shape)
+                # raise Exception
+                b[A_size:] = -admm_weight * (qx_val[:, 0] - x0_ADMM)
         # cost_data1 = np.linalg.norm(b[:A_size])
         # cost_data2 = np.linalg.norm(b0[A_size:])
         # model_norm = np.linalg.norm(model)
         if Config.verbose:
-            cost_data = -1.0
-            cost_data_model = 0.0
-            if cost_data2 > 0:
-                cost_data = cost_data1 / cost_data2
-            if model_norm > 0:
-                cost_data_model = cost_data1 / model_norm
-            cost_admm1 = np.linalg.norm(qx_val - admm_method.z)
-            cost_admm2 = np.linalg.norm(admm_method.z)
-            cost_admm = -1.0
-            if cost_admm2 > 0:
-                cost_admm = cost_admm1 / cost_admm2
-            print("----------------------------------------")
-            print(f"it = {_i}")
-            print("cost_data = ", cost_data)
-            print("cost_data_model = ", cost_data_model)
-            print("cost_admm = ", cost_admm)
-            print("----------------------------------------")
+            if use_batch_mode:
+                # In batch mode, compute metrics on the full constraint set
+                Qx_full = Q @ model
+                cost_admm1 = np.linalg.norm(Qx_full / admm_weight - admm_method.z)
+                cost_admm2 = np.linalg.norm(admm_method.z)
+                print("----------------------------------------")
+                print(f"it = {_i} (batch mode: {n_batch}/{n_ie} constraints)")
+                print(f"cost_admm = {cost_admm1 / cost_admm2 if cost_admm2 > 0 else -1.0}")
+                print("----------------------------------------")
+            else:
+                cost_data = -1.0
+                cost_data_model = 0.0
+                # if cost_data2 > 0:
+                #     cost_data = cost_data1 / cost_data2
+                # if model_norm > 0:
+                #     cost_data_model = cost_data1 / model_norm
+                cost_admm1 = np.linalg.norm(qx_val - admm_method.z)
+                cost_admm2 = np.linalg.norm(admm_method.z)
+                cost_admm = -1.0
+                if cost_admm2 > 0:
+                    cost_admm = cost_admm1 / cost_admm2
+                print("----------------------------------------")
+                print(f"it = {_i}")
+                print("cost_data = ", cost_data)
+                print("cost_data_model = ", cost_data_model)
+                print("cost_admm = ", cost_admm)
+                print("----------------------------------------")
         linsys_kwargs = {k:v[_i] for k,v in linsys_solver_kwargs.items()}
         x = lsmr(matrix, b, **linsys_kwargs)
         model += x[0]
diff --git a/tests/test_batch_mode.py b/tests/test_batch_mode.py
@@ -0,0 +1,96 @@
+"""
+Unit tests for ADMM batch mode.
+"""
+import numpy as np
+from scipy.sparse import csr_matrix
+
+from loopsolver import admm_solve
+
+
+def _build_problem(seed=42, n_data=30, n_vars=15, n_ineq=200):  # seeded random fixture for admm_solve
+    rng = np.random.RandomState(seed)  # local generator, so the same seed rebuilds the same problem
+    A = csr_matrix(rng.randn(n_data, n_vars))  # dense random values stored in CSR form
+    x_true = rng.randn(n_vars)  # reference solution used to derive b and the bounds
+    b = A @ x_true + 0.1 * rng.randn(n_data)  # data generated from x_true plus Gaussian noise
+
+    Q = csr_matrix(rng.randn(n_ineq, n_vars))  # one row per inequality constraint
+    Q_x_true = Q @ x_true
+    bounds = np.column_stack([  # per-row interval of half-width 0.5 centred on Q @ x_true
+        Q_x_true - 0.5,
+        Q_x_true + 0.5,
+    ])
+
+    x0 = np.zeros(n_vars)  # zero starting model
+    return A, b, Q, bounds, x0
+
+
+def test_admm_batch_size_runs():  # smoke test: the batch_size path runs and yields a finite result
+    A, b, Q, bounds, x0 = _build_problem()
+
+    result = admm_solve(
+        A,
+        b,
+        Q,
+        bounds,
+        x0,
+        admm_weight=0.1,
+        nmajor=10,  # number of outer iterations
+        batch_size=50,  # sample 50 of the fixture's 200 inequality constraints per iteration
+        random_seed=123,  # seeds the RandomState used for batch sampling
+        linsys_solver_kwargs={"atol": 1e-6, "btol": 1e-6},  # forwarded to lsmr
+    )
+
+    assert result.shape == (A.shape[1],)  # one value per model variable
+    assert np.all(np.isfinite(result))  # no NaN/inf in the result
+
+
+def test_admm_batch_fraction_runs():  # smoke test: the batch_fraction path runs and yields a finite result
+    A, b, Q, bounds, x0 = _build_problem(seed=7)
+
+    result = admm_solve(
+        A,
+        b,
+        Q,
+        bounds,
+        x0,
+        admm_weight=0.1,
+        nmajor=10,  # number of outer iterations
+        batch_fraction=0.25,  # int(200 * 0.25) = 50 constraints sampled per iteration
+        random_seed=456,  # seeds the RandomState used for batch sampling
+        linsys_solver_kwargs={"atol": 1e-6, "btol": 1e-6},  # forwarded to lsmr
+    )
+
+    assert result.shape == (A.shape[1],)  # one value per model variable
+    assert np.all(np.isfinite(result))  # no NaN/inf in the result
+
+
+def test_admm_batch_mode_matches_full_shape():  # compares shape and finiteness only, not values
+    A, b, Q, bounds, x0 = _build_problem(seed=99)
+
+    full_result = admm_solve(  # reference run: no batch arguments, so every constraint is used
+        A,
+        b,
+        Q,
+        bounds,
+        x0,
+        admm_weight=0.1,
+        nmajor=5,
+        linsys_solver_kwargs={"atol": 1e-6, "btol": 1e-6},
+    )
+
+    batch_result = admm_solve(  # same problem and settings, with batch sampling enabled
+        A,
+        b,
+        Q,
+        bounds,
+        x0,
+        admm_weight=0.1,
+        nmajor=5,
+        batch_size=40,  # 40 of the fixture's 200 inequality constraints per iteration
+        random_seed=789,  # seeds the RandomState used for batch sampling
+        linsys_solver_kwargs={"atol": 1e-6, "btol": 1e-6},
+    )
+
+    assert full_result.shape == batch_result.shape  # numerical agreement is not asserted
+    assert np.all(np.isfinite(full_result))
+    assert np.all(np.isfinite(batch_result))