Skip to content

Navigation Menu

Sign in
Appearance settings

Search code, repositories, users, issues, pull requests...

Provide feedback

We read every piece of feedback, and take your input very seriously.

Saved searches

Use saved searches to filter your results more quickly

Sign up
Appearance settings
This repository was archived by the owner on Jul 24, 2024. It is now read-only.

Commit de9b92b

Browse files
eric-valente
authored and
Stephen Hoover
committed
Exposing the lower and upper limits V.2 (#41)
Follow the behavior of the R wrapper for allowing users to specify lower and upper limits on coefficients.
1 parent 87ca3af commit de9b92b

File tree

4 files changed

+88
-15
lines changed

4 files changed

+88
-15
lines changed

‎glmnet/linear.py‎

Lines changed: 35 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -44,6 +44,15 @@ class ElasticNet(BaseEstimator):
4444
will be on the scale of the original data regardless of the value
4545
of standardize.
4646
47+
lower_limits : array, shape (n_features,), default -infinity
48+
Array of lower limits for each coefficient, must be non-positive.
49+
Can be a single value (which is then replicated), else an array
50+
corresponding to the number of features.
51+
52+
upper_limits : array, shape (n_features,), default +infinity
53+
Array of upper limits for each coefficient, must be positive.
54+
See lower_limits.
55+
4756
fit_intercept : bool, default True
4857
Include an intercept term in the model.
4958
@@ -128,6 +137,7 @@ class ElasticNet(BaseEstimator):
128137

129138
def __init__(self, alpha=1, n_lambda=100, min_lambda_ratio=1e-4,
130139
lambda_path=None, standardize=True, fit_intercept=True,
140+
lower_limits=-np.inf, upper_limits=np.inf,
131141
cut_point=1.0, n_splits=3, scoring=None, n_jobs=1, tol=1e-7,
132142
max_iter=100000, random_state=None, max_features=None, verbose=False):
133143

@@ -136,6 +146,8 @@ def __init__(self, alpha=1, n_lambda=100, min_lambda_ratio=1e-4,
136146
self.min_lambda_ratio = min_lambda_ratio
137147
self.lambda_path = lambda_path
138148
self.standardize = standardize
149+
self.lower_limits = lower_limits
150+
self.upper_limits = upper_limits
139151
self.fit_intercept = fit_intercept
140152
self.cut_point = cut_point
141153
self.n_splits = n_splits
@@ -146,7 +158,6 @@ def __init__(self, alpha=1, n_lambda=100, min_lambda_ratio=1e-4,
146158
self.random_state = random_state
147159
self.max_features = max_features
148160
self.verbose = verbose
149-
150161
self.cv = None
151162

152163
def fit(self, X, y, sample_weight=None, relative_penalties=None):
@@ -185,16 +196,33 @@ def fit(self, X, y, sample_weight=None, relative_penalties=None):
185196
self : object
186197
Returns self.
187198
"""
199+
200+
X, y = check_X_y(X, y, accept_sparse='csr', ensure_min_samples=2)
201+
if sample_weight is None:
202+
sample_weight = np.ones(X.shape[0])
203+
204+
if not np.isscalar(self.lower_limits):
205+
self.lower_limits = np.asarray(self.lower_limits)
206+
if len(self.lower_limits) != X.shape[1]:
207+
raise ValueError("lower_limits must equal number of features")
208+
209+
if not np.isscalar(self.upper_limits):
210+
self.upper_limits = np.asarray(self.upper_limits)
211+
if len(self.upper_limits) != X.shape[1]:
212+
raise ValueError("upper_limits must equal number of features")
213+
214+
if any(self.lower_limits > 0) if isinstance(self.lower_limits, np.ndarray) else self.lower_limits > 0:
215+
raise ValueError("lower_limits must be non-positive")
216+
217+
if any(self.upper_limits < 0) if isinstance(self.upper_limits, np.ndarray) else self.upper_limits < 0:
218+
raise ValueError("upper_limits must be positive")
219+
188220
if self.alpha > 1 or self.alpha < 0:
189221
raise ValueError("alpha must be between 0 and 1")
190222

191223
if self.n_splits > 0 and self.n_splits < 3:
192224
raise ValueError("n_splits must be at least 3")
193225

194-
X, y = check_X_y(X, y, accept_sparse='csr', ensure_min_samples=2)
195-
if sample_weight is None:
196-
sample_weight = np.ones(X.shape[0])
197-
198226
self._fit(X, y, sample_weight, relative_penalties)
199227

200228
if self.n_splits >= 3:
@@ -247,8 +275,8 @@ def _fit(self, X, y, sample_weight, relative_penalties):
247275
order='F')
248276

249277
coef_bounds = np.empty((2, X.shape[1]), dtype=np.float64, order='F')
250-
coef_bounds[0, :] = -np.inf
251-
coef_bounds[1, :] = np.inf
278+
coef_bounds[0, :] = self.lower_limits
279+
coef_bounds[1, :] = self.upper_limits
252280

253281
if X.shape[1] > X.shape[0]:
254282
# the glmnet docs suggest using a different algorithm for the case

‎glmnet/logistic.py‎

Lines changed: 35 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -48,6 +48,15 @@ class LogitNet(BaseEstimator):
4848
4949
fit_intercept : bool, default True
5050
Include an intercept term in the model.
51+
52+
lower_limits : array, shape (n_features,), default -infinity
53+
Array of lower limits for each coefficient, must be non-positive.
54+
Can be a single value (which is then replicated), else an array
55+
corresponding to the number of features.
56+
57+
upper_limits : array, shape (n_features,), default +infinity
58+
Array of upper limits for each coefficient, must be positive.
59+
See lower_limits.
5160
5261
cut_point : float, default 1
5362
The cut point to use for selecting lambda_best.
@@ -133,6 +142,7 @@ class LogitNet(BaseEstimator):
133142

134143
def __init__(self, alpha=1, n_lambda=100, min_lambda_ratio=1e-4,
135144
lambda_path=None, standardize=True, fit_intercept=True,
145+
lower_limits=-np.inf, upper_limits=np.inf,
136146
cut_point=1.0, n_splits=3, scoring=None, n_jobs=1, tol=1e-7,
137147
max_iter=100000, random_state=None, max_features=None, verbose=False):
138148

@@ -141,6 +151,8 @@ def __init__(self, alpha=1, n_lambda=100, min_lambda_ratio=1e-4,
141151
self.min_lambda_ratio = min_lambda_ratio
142152
self.lambda_path = lambda_path
143153
self.standardize = standardize
154+
self.lower_limits = lower_limits
155+
self.upper_limits = upper_limits
144156
self.fit_intercept = fit_intercept
145157
self.cut_point = cut_point
146158
self.n_splits = n_splits
@@ -151,7 +163,6 @@ def __init__(self, alpha=1, n_lambda=100, min_lambda_ratio=1e-4,
151163
self.random_state = random_state
152164
self.max_features = max_features
153165
self.verbose = verbose
154-
155166
self.cv = None
156167

157168
def fit(self, X, y, sample_weight=None, relative_penalties=None):
@@ -190,12 +201,28 @@ def fit(self, X, y, sample_weight=None, relative_penalties=None):
190201
self : object
191202
Returns self.
192203
"""
193-
if self.alpha > 1 or self.alpha < 0:
194-
raise ValueError("alpha must be between 0 and 1")
195-
196204
X, y = check_X_y(X, y, accept_sparse='csr', ensure_min_samples=2)
197205
if sample_weight is None:
198-
sample_weight = np.ones(X.shape[0])
206+
sample_weight = np.ones(X.shape[0])
207+
208+
if not np.isscalar(self.lower_limits):
209+
self.lower_limits = np.asarray(self.lower_limits)
210+
if len(self.lower_limits) != X.shape[1]:
211+
raise ValueError("lower_limits must equal number of features")
212+
213+
if not np.isscalar(self.upper_limits):
214+
self.upper_limits = np.asarray(self.upper_limits)
215+
if len(self.upper_limits) != X.shape[1]:
216+
raise ValueError("upper_limits must equal number of features")
217+
218+
if any(self.lower_limits > 0) if isinstance(self.lower_limits, np.ndarray) else self.lower_limits > 0:
219+
raise ValueError("lower_limits must be non-positive")
220+
221+
if any(self.upper_limits < 0) if isinstance(self.upper_limits, np.ndarray) else self.upper_limits < 0:
222+
raise ValueError("upper_limits must be positive")
223+
224+
if self.alpha > 1 or self.alpha < 0:
225+
raise ValueError("alpha must be between 0 and 1")
199226

200227
# fit the model
201228
self._fit(X, y, sample_weight, relative_penalties)
@@ -293,9 +320,9 @@ def _fit(self, X, y, sample_weight=None, relative_penalties=None):
293320
relative_penalties = np.ones(X.shape[1], dtype=np.float64,
294321
order='F')
295322

296-
coef_bounds = np.empty((2, X.shape[1]), dtype=np.float64, order='F')
297-
coef_bounds[0, :] = -np.inf
298-
coef_bounds[1, :] = np.inf
323+
coef_bounds = np.empty((2, X.shape[1]), dtype=np.float64, order='F')
324+
coef_bounds[0, :] = self.lower_limits
325+
coef_bounds[1, :] = self.upper_limits
299326

300327
if n_classes == 2:
301328
# binomial, tell glmnet there is only one class

‎glmnet/tests/test_linear.py‎

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -102,6 +102,15 @@ def test_alphas(self):
102102
m = m.fit(x, y)
103103
self.check_r2_score(y, m.predict(x), 0.90, alpha=alpha)
104104

105+
def test_coef_limits(self):
106+
x, y = self.inputs[0]
107+
lower_limits = np.repeat(-1, x.shape[1])
108+
upper_limits = 0
109+
m = ElasticNet(lower_limits=lower_limits, upper_limits=upper_limits, random_state=5934, alpha=0)
110+
m = m.fit(x, y)
111+
assert(np.all(m.coef_ >= -1))
112+
assert(np.all(m.coef_ <= 0))
113+
105114
def test_n_splits(self):
106115
x, y = self.inputs[0]
107116
for n in self.n_splits:

‎glmnet/tests/test_logistic.py‎

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -92,6 +92,15 @@ def test_alphas(self):
9292
m = m.fit(x, y)
9393
check_accuracy(y, m.predict(x), 0.85, alpha=alpha)
9494

95+
def test_coef_limits(self):
96+
x, y = self.binomial[0]
97+
lower_limits = np.repeat(-1, x.shape[1])
98+
upper_limits = 0
99+
m = LogitNet(lower_limits=lower_limits, upper_limits=upper_limits, random_state=69265, alpha=0)
100+
m = m.fit(x, y)
101+
assert(np.all(m.coef_ >= -1))
102+
assert(np.all(m.coef_ <= 0))
103+
95104
def test_relative_penalties(self):
96105
x, y = self.binomial[0]
97106
p = x.shape[1]

0 commit comments

Comments
(0)

Page converted by AltStyle (-> original) /