8 changes: 4 additions & 4 deletions yaglm/config/penalty.py
@@ -31,7 +31,7 @@ class Ridge(WithPenSeqConfig):
         (Optional) Weights for each term in the penalty.
     """
     @autoassign
-    def __init__(self, pen_val=1, weights=None): pass
+    def __init__(self, pen_val=1, weights=None, targ_ubd=1): pass

     def get_pen_val_max(self, X, y, loss, fit_intercept=True,
                         sample_weight=None, init_data=None):
@@ -40,7 +40,7 @@ def get_pen_val_max(self, X, y, loss, fit_intercept=True,
             weights=self.weights,
             fit_intercept=fit_intercept,
             sample_weight=sample_weight,
-            targ_ubd=1,
+            targ_ubd=self.targ_ubd,
             norm_by_dim=True)
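This change promotes the previously hard-coded upper-bound target to a config argument. A minimal sketch of the new knob (illustrative only, not part of the diff; it assumes @autoassign binds each __init__ argument to an attribute, which the use of self.targ_ubd above relies on):

    from yaglm.config.penalty import Ridge

    # targ_ubd is now stored on the config by @autoassign and read back
    # as self.targ_ubd inside get_pen_val_max, instead of always being 1
    cfg = Ridge(pen_val=1, targ_ubd=2)
    print(cfg.targ_ubd)  # 2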


@@ -310,12 +310,12 @@ class ElasticNet(ElasticNetConfig):
"""
Represents the ElasticNet penalty

pen_val * mix_val ||coef||_1 + 0.5 * pen_val * (1 - mix_val) * ||coef||_2^2
pen_val * mix_val ||coef||_1 + pen_val * (1 - mix_val) * ||coef||_2^2

The Lasso may have weights (though not the ridge at this time) or may be flavored.
We define the non-convex elastic net as

non-convex_{pen_val * mix_val} (coef) + 0.5 * pen_val * (1 - mix_val) * ||coef||_2^2
non-convex_{pen_val * mix_val} (coef) + pen_val * (1 - mix_val) * ||coef||_2^2

Parameters
----------
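Both docstring formulas drop the 0.5 factor on the ridge term. A minimal sketch of the updated parameterization (enet_penalty is a hypothetical helper for illustration, not part of yaglm):

    import numpy as np

    def enet_penalty(coef, pen_val, mix_val):
        # pen_val * mix_val ||coef||_1 + pen_val * (1 - mix_val) * ||coef||_2^2
        l1 = np.abs(coef).sum()
        l2_sq = (coef ** 2).sum()
        return pen_val * (mix_val * l1 + (1 - mix_val) * l2_sq)

    coef = np.array([1.5, -2.0, 0.0, 0.7])
    # l1 = 4.2, l2_sq = 6.74, so 0.1 * (0.5 * 4.2 + 0.5 * 6.74) = 0.547
    print(enet_penalty(coef, pen_val=0.1, mix_val=0.5))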
11 changes: 10 additions & 1 deletion yaglm/infer/Inferencer.py
@@ -6,7 +6,7 @@
 from yaglm.config.base import Config
 from yaglm.autoassign import autoassign
 from yaglm.config.penalty import Lasso
-from yaglm.infer.dof import est_dof_support
+from yaglm.infer.dof import est_dof_support, est_dof_enet
 from yaglm.utils import is_fitted
 from yaglm.config.loss import get_loss_config

@@ -136,6 +136,15 @@ def after_fit(self, estimator, X, y, sample_weight=None):
             else:
                 # we don't currently support estimating the DoF for this model
                 self.dof_ = None

+        elif self.dof == 'enet':
+            self.dof_ = est_dof_enet(coef=estimator.coef_,
+                                     pen_val=estimator.fit_penalty_.pen_val,
+                                     mix_val=estimator.fit_penalty_.mix_val,
+                                     X=X,
+                                     intercept=estimator.intercept_,
+                                     zero_tol=zero_tol)

         elif isinstance(self.dof, Number):
             # user provided DOF value
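A hedged usage sketch of the new branch (assuming Inferencer accepts dof as a constructor argument, as self.dof above suggests; the estimator wiring is illustrative):

    from yaglm.infer.Inferencer import Inferencer

    # est is assumed to be an estimator already fit with an ElasticNet
    # penalty, exposing coef_, intercept_ and fit_penalty_
    inferencer = Inferencer(dof='enet')
    inferencer.after_fit(est, X, y)
    print(inferencer.dof_)  # trace-based DoF estimate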
63 changes: 63 additions & 0 deletions yaglm/infer/dof.py
@@ -49,3 +49,66 @@ def est_dof_support(coef, intercept=None, transform=None, zero_tol=1e-6):

     DoF = n_nonzero_coef + n_vals_intercept
     return DoF


+def est_dof_enet(coef, pen_val, mix_val, X, intercept=None, zero_tol=1e-6):
+    """
+    Estimates the degrees of freedom of an elastic net fit at a particular
+    penalty and mixing value.
+
+    ElasticNet penalty:
+
+    pen_val * mix_val ||coef||_1 + pen_val * (1 - mix_val) * ||coef||_2^2
+
+    Parameters
+    ----------
+    coef: array-like
+        The estimated coefficient.
+
+    pen_val: float
+        The penalty value in the elastic net penalty.
+
+    mix_val: float
+        The mixing value in the elastic net penalty.
+
+    X: (n, d) array
+        The design matrix, excluding the intercept column.
+
+    intercept: None, float, array-like
+        (Optional) The estimated intercept.
+
+    zero_tol: float
+        Tolerance for declaring a small value equal to zero. This addresses
+        numerical issues where some solvers may not return exact zeros.
+
+    Output
+    ------
+    DoF: float
+        The estimated number of degrees of freedom, given by
+        tr(X_A (X_A^T X_A + lambda_2 I)^{-1} X_A^T), where A is the
+        estimated support of coef and lambda_2 = pen_val * (1 - mix_val).
+
+    References
+    ----------
+    Zou, H., Hastie, T. and Tibshirani, R., 2007. On the “degrees of freedom”
+    of the lasso. The Annals of Statistics, 35(5), pp.2173-2192.
+    """
+    # get the estimated support from the fitted coefficient
+    if intercept is not None:
+        coef = np.concatenate([[intercept], coef])
+    support = (abs(coef) > zero_tol)
+
+    # tuning parameter attached to the ridge penalty
+    lambda_2 = pen_val * (1 - mix_val)
+
+    # pull out the columns of the design matrix in the support,
+    # prepending a column of ones when there is an intercept
+    if intercept is not None:
+        ones = np.ones((X.shape[0], 1))
+        X = np.concatenate([ones, X], axis=1)
+    X_A = X[:, support].copy()
+
+    # DoF = trace of the ridge-regularized hat matrix on the support
+    xtx_li_inv = np.linalg.inv(X_A.T @ X_A + lambda_2 * np.identity(X_A.shape[1]))
+    DoF = np.trace(X_A @ xtx_li_inv @ X_A.T)
+
+    return DoF
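A quick sanity check on synthetic data (illustrative; the expected values follow from the trace formula above):

    import numpy as np
    from yaglm.infer.dof import est_dof_enet

    rng = np.random.default_rng(0)
    X = rng.normal(size=(100, 10))
    coef = np.zeros(10)
    coef[:3] = [1.5, -2.0, 0.7]  # support of size 3

    # with mix_val=1 the ridge term vanishes (lambda_2 = 0) and the
    # estimate reduces to the support size, i.e. the lasso DoF
    print(est_dof_enet(coef, pen_val=0.1, mix_val=1.0, X=X))  # 3.0
    # with mix_val < 1 the ridge term shrinks the estimate below 3
    print(est_dof_enet(coef, pen_val=0.1, mix_val=0.5, X=X))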