Use dtype dependent precision #844

Merged (12 commits, Nov 8, 2024)
8 changes: 6 additions & 2 deletions CHANGELOG.rst
@@ -7,13 +7,17 @@
 Changelog
 =========

-3.0.3 - unreleased
+3.1.0 - unreleased
 ------------------

-**Bug fix:
+**Bug fix:**

 - Fixed a bug where :meth:`glum.GeneralizedLinearRegressor.fit` would raise a ``dtype`` mismatch error if fit with ``alpha_search=True``.

+**Other changes:**
+
+- Use data type (``float64`` or ``float32``) dependent precision in solvers.
+
 3.0.2 - 2024-06-25
 ------------------
5 changes: 3 additions & 2 deletions src/glum/_cd_fast.pyx
@@ -117,7 +117,8 @@ def enet_coordinate_descent_gram(int[::1] active_set,
                                  bint has_lower_bounds,
                                  floating[:] lower_bounds,
                                  bint has_upper_bounds,
-                                 floating[:] upper_bounds):
+                                 floating[:] upper_bounds,
+                                 floating eps):
     """Cython version of the coordinate descent algorithm
     for Elastic-Net regression
     We minimize
@@ -162,7 +163,7 @@ def enet_coordinate_descent_gram(int[::1] active_set,
     else:
         P1_ii = P1[ii - intercept]

-    if Q[active_set_ii, active_set_ii] == 0.0:
+    if Q[active_set_ii, active_set_ii] <= eps:
         continue

     w_ii = w[ii]  # Store previous value
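Why a dtype-scaled tolerance instead of an exact-zero test: with float32 inputs, a Gram-matrix diagonal entry that is analytically zero can come out as a tiny nonzero value, so the skip branch above never fired. A minimal NumPy sketch of the failure mode (illustrative values; the 16 * eps factor matches what _cd_solver passes in below):

import numpy as np

# A constant feature: after centering, its variance is analytically zero, but
# float32 rounding in the mean can leave tiny nonzero residuals.
x = np.full(1000, 0.1, dtype=np.float32)
x_centered = x - x.mean()

q_diag = x_centered @ x_centered      # one diagonal entry of Q = X.T @ X
eps = np.finfo(np.float32).eps * 16   # ~1.9e-6

print(q_diag == 0.0)  # old check: may be False despite the analytic zero
print(q_diag <= eps)  # new check: True, so the coordinate is safely skipped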
2 changes: 1 addition & 1 deletion src/glum/_glm.py
@@ -452,7 +452,7 @@ def _one_over_var_inf_to_val(arr: np.ndarray, val: float) -> np.ndarray:

     If values are zeros, return val.
     """
-    zeros = np.where(np.abs(arr) < 1e-7)
+    zeros = np.where(np.abs(arr) < np.sqrt(np.finfo(arr.dtype).eps))
Member commented:

@mlondschien, what was the logic for this change? It's a slightly stricter criterion for float64 than before, which is causing test failures downstream.

@mlondschien (Contributor, Author) replied on Nov 8, 2024:

In [4]: np.sqrt(np.finfo(np.float32).eps)
Out[4]: np.float32(0.00034526698)

In [5]: np.sqrt(np.finfo(np.float64).eps)
Out[5]: np.float64(1.4901161193847656e-08)

None. I thought that's where the 1e-7 came from. I don't really know what would be "good" values here. Just that 1e-7 is too strict for float32. Sorry!

I guess zeros = np.where(np.abs(arr) < np.sqrt(np.finfo(arr.dtype).eps) / 10) should do the trick 🤷 .

Essentially we're doing

var = 0 - 0
std = np.sqrt(var)
normalized_values = values * _one_over_var_inf_to_val(std, 1)

     with np.errstate(divide="ignore"):
         one_over = 1 / arr
     one_over[zeros] = val
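For reference, a self-contained sketch of the helper after this change (body assembled from the diff context above; the trailing return is assumed):

import numpy as np

def _one_over_var_inf_to_val(arr: np.ndarray, val: float) -> np.ndarray:
    """Return 1 / arr, mapping (numerically) zero entries to val."""
    zeros = np.where(np.abs(arr) < np.sqrt(np.finfo(arr.dtype).eps))
    with np.errstate(divide="ignore"):
        one_over = 1 / arr
    one_over[zeros] = val
    return one_over

std = np.array([2.0, 1e-5, 0.0], dtype=np.float32)
print(_one_over_var_inf_to_val(std, 1.0))
# -> [0.5, 1.0, 1.0]: 1e-5 is below sqrt(float32 eps) ~ 3.45e-4 and is treated
#    as zero, whereas the old fixed 1e-7 cutoff would have returned 1e5.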
11 changes: 9 additions & 2 deletions src/glum/_solvers.py
@@ -70,6 +70,7 @@ def _cd_solver(state, data, active_hessian):
         data._lower_bounds,
         data.has_upper_bounds,
         data._upper_bounds,
+        np.finfo(state.coef.dtype).eps * 16,
     )
     return new_coef - state.coef, n_cycles
@@ -759,7 +760,8 @@ def line_search(state: IRLSState, data: IRLSData, d: np.ndarray):
"""
# line search parameters
(beta, sigma) = (0.5, 0.0001)
eps = 16 * np.finfo(state.obj_val.dtype).eps # type: ignore
# state.obj_val is np.float64, even if coef is np.float32
mlondschien marked this conversation as resolved.
Show resolved Hide resolved
eps = 16 * np.finfo(state.coef.dtype).eps # type: ignore

# line search by sequence beta^k, k=0, 1, ..
# F(w + lambda d) - F(w) <= lambda * bound
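A short sketch of why eps must track the coefficient dtype (illustrative numbers): a tolerance of 16 * float64-eps is around 3.6e-15, far below anything float32 arithmetic can resolve, so a float32 fit could stall against it indefinitely.

import numpy as np

eps64 = 16 * np.finfo(np.float64).eps   # ~3.55e-15 (old: from obj_val's dtype)
eps32 = 16 * np.finfo(np.float32).eps   # ~1.91e-6  (new: from float32 coefs)

obj = np.float32(1.2345678)
step = np.float32(1e-8)         # a change below float32 resolution at this scale
print(obj + step == obj)        # True: the change is invisible in float32
print(step < eps32 * abs(obj))  # True: the new eps classifies it as negligible
print(step < eps64 * abs(obj))  # False: the old eps would not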
@@ -792,7 +794,12 @@ def line_search(state: IRLSState, data: IRLSData, d: np.ndarray):
     )
     # 1. Check Armijo / sufficient decrease condition.
     loss_improvement = obj_val_wd - state.obj_val
-    if mu_wd.max() < 1e43 and loss_improvement <= factor * bound:
+    if mu_wd.dtype == np.float32:
+        large_number = 1e30
+    else:
+        large_number = 1e43
+
+    if mu_wd.max() < large_number and loss_improvement <= factor * bound:
         break
     # 2. Deal with relative loss differences around machine precision.
     tiny_loss = np.abs(state.obj_val * eps)  # type: ignore
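The old 1e43 guard is vacuous for float32, whose largest finite value is about 3.4e38: every finite float32 compares below 1e43, so divergence of the fitted means was never caught. A small demonstration:

import numpy as np

print(np.finfo(np.float32).max)          # 3.4028235e+38
mu = np.array([1e35], dtype=np.float32)  # a clearly diverging mean
print(mu.max() < 1e43)                   # True: the old guard never fires
print(mu.max() < 1e30)                   # False: the new float32 guard catches it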