Commit 8283126

pprett authored and GaelVaroquaux committed
refactored input validation; special loss function factory for huber and epsilon insensitive loss
1 parent 767ec5d commit 8283126

1 file changed (+78 −62)

sklearn/linear_model/stochastic_gradient.py

Lines changed: 78 additions & 62 deletions
@@ -36,6 +36,9 @@
 """For sparse data intercept updates are scaled by this decay factor to avoid
 intercept oscillation."""
 
+DEFAULT_EPSILON = 0.1
+"""Default value of ``epsilon`` parameter. """
+
 
 class BaseSGD(BaseEstimator):
     """Base class for SGD classification and regression."""
@@ -46,44 +49,32 @@ def __init__(self, loss, penalty='l2', alpha=0.0001,
                  rho=0.85, fit_intercept=True, n_iter=5, shuffle=False,
                  verbose=0, epsilon=0.1, seed=0, learning_rate="optimal",
                  eta0=0.0, power_t=0.5, warm_start=False):
-        self.loss = str(loss)
-        self.penalty = str(penalty).lower()
-        self.learning_rate = str(learning_rate)
-
-        # raises ValueError if not registered
-        self.get_penalty_type(self.penalty)
-        self.get_learning_rate_type(self.learning_rate)
-
-        self.epsilon = float(epsilon)
-        self.alpha = float(alpha)
-        if self.alpha < 0.0:
-            raise ValueError("alpha must be greater than zero")
-        self.rho = float(rho)
-        if self.rho < 0.0 or self.rho > 1.0:
-            raise ValueError("rho must be in [0, 1]")
-        self.fit_intercept = bool(fit_intercept)
-        self.n_iter = int(n_iter)
-        if self.n_iter <= 0:
-            raise ValueError("n_iter must be greater than zero")
-        if not isinstance(shuffle, bool):
-            raise ValueError("shuffle must be either True or False")
-        self.shuffle = bool(shuffle)
+        self.loss = loss
+        self.penalty = penalty
+        self.learning_rate = learning_rate
+        self.epsilon = epsilon
+        self.alpha = alpha
+        self.rho = rho
+        self.fit_intercept = fit_intercept
+        self.n_iter = n_iter
+        self.shuffle = shuffle
         self.seed = seed
-        self.verbose = int(verbose)
-
-        self.eta0 = float(eta0)
-        self.power_t = float(power_t)
-        if self.learning_rate != "optimal":
-            if eta0 <= 0.0:
-                raise ValueError("eta0 must be greater than 0.0")
-        self.coef_ = None
+        self.verbose = verbose
+        self.eta0 = eta0
+        self.power_t = power_t
         self.warm_start = warm_start
 
-        #self._init_t()
+        self._validate_params()
+
+        self.coef_ = None
         # iteration count for learning rate schedule
         # must not be int (e.g. if ``learning_rate=='optimal'``)
         self.t_ = None
 
+    def set_params(self, *args, **kwargs):
+        super(BaseSGD, self).set_params(*args, **kwargs)
+        self._validate_params()
+
     @abstractmethod
     def fit(self, X, y):
         """Fit model."""
@@ -92,6 +83,27 @@ def fit(self, X, y):
     def predict(self, X):
         """Predict using model."""
 
+    def _validate_params(self):
+        """Validate input params. """
+        if not isinstance(self.shuffle, bool):
+            raise ValueError("shuffle must be either True or False")
+        if self.n_iter <= 0:
+            raise ValueError("n_iter must be greater than zero")
+        if not (0.0 <= self.rho <= 1.0):
+            raise ValueError("rho must be in [0, 1]")
+        if self.alpha < 0.0:
+            raise ValueError("alpha must be greater than zero")
+        if self.learning_rate != "optimal":
+            if self.eta0 <= 0.0:
+                raise ValueError("eta0 must be greater than 0.0")
+
+        # raises ValueError if not registered
+        self._get_penalty_type(self.penalty)
+        self._get_learning_rate_type(self.learning_rate)
+
+        if self.loss not in self.loss_functions:
+            raise ValueError("The loss %s is not supported. " % self.loss)
+
     def _init_t(self, loss_function):
         """Initialize iteration counter attr ``t_``.
 
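Because _validate_params is also invoked from _partial_fit (see the hunks further down), parameters mutated directly on the instance, bypassing set_params, are still checked before the next fit. A hedged illustration, reusing the hypothetical Estimator sketch above:

    est = Estimator(alpha=0.0001)
    est.alpha = -1.0    # direct mutation skips the set_params check
    # A fit method that starts with self._validate_params() would now
    # raise ValueError before touching the data.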
@@ -111,18 +123,21 @@ def get_loss_function(self, loss):
         try:
             loss_ = self.loss_functions[loss]
             loss_class, args = loss_[0], loss_[1:]
+            if loss in ('huber', 'epsilon_insensitive'):
+                args = (self.epsilon, )
             return loss_class(*args)
         except KeyError:
             raise ValueError("The loss %s is not supported. " % loss)
 
-    def get_learning_rate_type(self, learning_rate):
+    def _get_learning_rate_type(self, learning_rate):
         try:
             return LEARNING_RATE_TYPES[learning_rate]
         except KeyError:
             raise ValueError("learning rate %s"
                              "is not supported. " % learning_rate)
 
-    def get_penalty_type(self, penalty):
+    def _get_penalty_type(self, penalty):
+        penalty = str(penalty).lower()
         try:
             return PENALTY_TYPES[penalty]
         except KeyError:
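The change to get_loss_function above is the "special loss function factory" from the commit message: the loss object is instantiated from the class-level table, but for the two epsilon-parameterized losses the current value of self.epsilon is substituted at call time in place of the DEFAULT_EPSILON placeholder stored in the table. A minimal sketch of the dispatch (the Hinge/Huber classes and Model here are simplified stand-ins, not the actual sklearn.linear_model types):

    DEFAULT_EPSILON = 0.1

    class Hinge(object):
        def __init__(self, threshold):
            self.threshold = threshold

    class Huber(object):
        def __init__(self, epsilon):
            self.epsilon = epsilon

    class Model(object):
        # class-level table: (loss class, default ctor args)
        loss_functions = {"hinge": (Hinge, 1.0),
                          "huber": (Huber, DEFAULT_EPSILON)}

        def __init__(self, epsilon=DEFAULT_EPSILON):
            self.epsilon = epsilon

        def get_loss_function(self, loss):
            try:
                loss_ = self.loss_functions[loss]
                loss_class, args = loss_[0], loss_[1:]
                if loss == 'huber':          # epsilon resolved per call
                    args = (self.epsilon, )
                return loss_class(*args)
            except KeyError:
                raise ValueError("The loss %s is not supported. " % loss)

    assert Model(epsilon=0.05).get_loss_function('huber').epsilon == 0.05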
@@ -338,9 +353,20 @@ class SGDClassifier(BaseSGD, ClassifierMixin, SelectorMixin):
     LinearSVC, LogisticRegression, Perceptron
 
     """
+
+    loss_functions = {
+        "hinge": (Hinge, 1.0),
+        "perceptron": (Hinge, 0.0),
+        "log": (Log, ),
+        "modified_huber": (ModifiedHuber, ),
+        "squared_loss": (SquaredLoss, ),
+        "huber": (Huber, DEFAULT_EPSILON),
+        "epsilon_insensitive": (EpsilonInsensitive, DEFAULT_EPSILON),
+    }
+
     def __init__(self, loss="hinge", penalty='l2', alpha=0.0001,
                  rho=0.85, fit_intercept=True, n_iter=5, shuffle=False,
-                 verbose=0, epsilon=0.1, n_jobs=1, seed=0,
+                 verbose=0, epsilon=DEFAULT_EPSILON, n_jobs=1, seed=0,
                  learning_rate="optimal", eta0=0.0, power_t=0.5,
                  class_weight=None, warm_start=False):
         super(SGDClassifier, self).__init__(loss=loss, penalty=penalty,
@@ -356,18 +382,6 @@ def __init__(self, loss="hinge", penalty='l2', alpha=0.0001,
         self.classes_ = None
         self.n_jobs = int(n_jobs)
 
-        self.loss_functions = {
-            "hinge": (Hinge, 1.0),
-            "perceptron": (Hinge, 0.0),
-            "log": (Log, ),
-            "modified_huber": (ModifiedHuber, ),
-            "squared_loss": (SquaredLoss, ),
-            "huber": (Huber, self.epsilon),
-            "epsilon_insensitive": (EpsilonInsensitive, self.epsilon),
-        }
-        if loss not in self.loss_functions:
-            raise ValueError("The loss %s is not supported. " % loss)
-
     @property
     @deprecated("to be removed in v0.13; use ``classes_`` instead.")
     def classes(self):
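Hoisting loss_functions to a class attribute (and dropping the per-instance copy above) works because the table no longer captures self.epsilon; the only instance-specific argument is injected by get_loss_function at call time. The "loss not supported" check moved into _validate_params, so an unsupported loss should, presumably, still fail at construction:

    # assumed behaviour after this commit: _validate_params runs in __init__
    SGDClassifier(loss="no_such_loss")   # raises ValueError("The loss ... is not supported. ")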
@@ -406,6 +420,8 @@ def _partial_fit(self, X, y, n_iter, classes=None, sample_weight=None,
         n_samples, n_features = X.shape
         _check_fit_data(X, y)
 
+        self._validate_params()
+
         if self.classes_ is None and classes is None:
             raise ValueError("classes must be passed on the first call "
                              "to partial_fit.")
@@ -696,13 +712,13 @@ def fit_binary(est, i, X, y, n_iter, pos_weight, neg_weight,
     assert y_i.shape[0] == y.shape[0] == sample_weight.shape[0]
     dataset, intercept_decay = _make_dataset(X, y_i, sample_weight)
 
-    penalty_type = est.get_penalty_type(est.penalty)
-    learning_rate_type = est.get_learning_rate_type(est.learning_rate)
+    penalty_type = est._get_penalty_type(est.penalty)
+    learning_rate_type = est._get_learning_rate_type(est.learning_rate)
 
     return plain_sgd(coef, intercept, est.loss_function,
                      penalty_type, est.alpha, est.rho,
-                     dataset, n_iter, est.fit_intercept,
-                     est.verbose, est.shuffle, est.seed,
+                     dataset, n_iter, int(est.fit_intercept),
+                     int(est.verbose), int(est.shuffle), est.seed,
                      pos_weight, neg_weight,
                      learning_rate_type, est.eta0,
                      est.power_t, est.t_, intercept_decay)
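The int() casts at the plain_sgd call site compensate for the constructor no longer coercing fit_intercept, verbose, and shuffle; plain_sgd is compiled (Cython) code, which presumably expects integer arguments rather than Python bools. A one-line illustration of the cast:

    int(True), int(False)   # (1, 0): bools become the ints the compiled SGD loop expects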
@@ -812,6 +828,13 @@ class SGDRegressor(BaseSGD, RegressorMixin, SelectorMixin):
     Ridge, ElasticNet, Lasso, SVR
 
     """
+
+    loss_functions = {
+        "squared_loss": (SquaredLoss, ),
+        "huber": (Huber, DEFAULT_EPSILON),
+        "epsilon_insensitive": (EpsilonInsensitive, DEFAULT_EPSILON)
+    }
+
     def __init__(self, loss="squared_loss", penalty="l2", alpha=0.0001,
                  rho=0.85, fit_intercept=True, n_iter=5, shuffle=False, verbose=0,
                  epsilon=0.1, p=None, seed=0, learning_rate="invscaling", eta0=0.01,
@@ -834,14 +857,6 @@ def __init__(self, loss="squared_loss", penalty="l2", alpha=0.0001,
                                            eta0=eta0, power_t=power_t,
                                            warm_start=False)
 
-        self.loss_functions = {
-            "squared_loss": (SquaredLoss, ),
-            "huber": (Huber, self.epsilon),
-            "epsilon_insensitive": (EpsilonInsensitive, self.epsilon)
-        }
-        if loss not in self.loss_functions:
-            raise ValueError("The loss %s is not supported. " % loss)
-
     def _partial_fit(self, X, y, n_iter, sample_weight=None,
                      coef_init=None, intercept_init=None):
         X, y = check_arrays(X, y, sparse_format="csr", copy=False,
@@ -851,6 +866,8 @@ def _partial_fit(self, X, y, n_iter, sample_weight=None,
         n_samples, n_features = X.shape
         _check_fit_data(X, y)
 
+        self._validate_params()
+
         # Allocate datastructures from input arguments
         sample_weight = self._validate_sample_weight(sample_weight, n_samples)
 
@@ -919,8 +936,7 @@ def fit(self, X, y, coef_init=None, intercept_init=None,
         self.coef_ = None
         self.intercept_ = None
 
-        # Need to re-initialize in case of multiple call to fit.
-        #self._init_t()
+        # Clear iteration count for multiple call to fit.
         self.t_ = None
 
         return self._partial_fit(X, y, self.n_iter, sample_weight,
@@ -960,8 +976,8 @@ def _fit_regressor(self, X, y, sample_weight, n_iter):
         dataset, intercept_decay = _make_dataset(X, y, sample_weight)
 
         loss_function = self.get_loss_function(self.loss)
-        penalty_type = self.get_penalty_type(self.penalty)
-        learning_rate_type = self.get_learning_rate_type(self.learning_rate)
+        penalty_type = self._get_penalty_type(self.penalty)
+        learning_rate_type = self._get_learning_rate_type(self.learning_rate)
 
         if self.t_ is None:
             self._init_t(loss_function)
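Taken together, these changes appear to make epsilon a live parameter: the loss object is built from self.epsilon at fit time rather than baked into a per-instance dict at __init__, so updating it via set_params should take effect on the next fit. A hedged usage sketch (behaviour inferred from this diff, not verified against the test suite):

    from sklearn.linear_model import SGDRegressor

    reg = SGDRegressor(loss="huber", epsilon=0.1)
    reg.set_params(epsilon=0.05)    # re-runs _validate_params
    # On the next fit, get_loss_function("huber") builds Huber(0.05),
    # not the Huber(0.1) that the old per-instance table would have kept.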

0 commit comments
