|
6 | 6 |
|
7 | 7 | import numpy as np |
8 | 8 | import scipy.sparse as sp |
| 9 | + |
| 10 | +from abc import ABCMeta, abstractmethod |
9 | 11 | import warnings |
10 | 12 |
|
11 | 13 | from ..externals.joblib import Parallel, delayed |
12 | 14 |
|
13 | | -from ..base import RegressorMixin |
14 | | -from ..base import ClassifierMixin |
| 15 | +from ..base import BaseEstimator, ClassifierMixin, RegressorMixin |
15 | 16 | from ..feature_selection.selector_mixin import SelectorMixin |
16 | | -from .base import BaseSGD |
17 | | -from ..utils import atleast2d_or_csr, check_arrays |
| 17 | +from ..utils import array2d, atleast2d_or_csr, check_arrays, safe_asarray |
18 | 18 | from ..utils.extmath import safe_sparse_dot |
19 | | -from ..utils import safe_asarray |
20 | 19 | from ..utils import deprecated |
21 | 20 |
|
22 | 21 | from .sgd_fast import plain_sgd as plain_sgd |
|
29 | 28 | from .sgd_fast import EpsilonInsensitive |
30 | 29 |
|
31 | 30 |
|
| 31 | +class BaseSGD(BaseEstimator): |
| 32 | + """Base class for dense and sparse SGD.""" |
| 33 | + |
| 34 | + __metaclass__ = ABCMeta |
| 35 | + |
| 36 | + def __init__(self, loss, penalty='l2', alpha=0.0001, |
| 37 | + rho=0.85, fit_intercept=True, n_iter=5, shuffle=False, |
| 38 | + verbose=0, epsilon=0.1, seed=0, learning_rate="optimal", |
| 39 | + eta0=0.0, power_t=0.5, warm_start=False): |
| 40 | + self.loss = str(loss) |
| 41 | + self.penalty = str(penalty).lower() |
| 42 | + self.epsilon = float(epsilon) |
| 43 | + self._set_loss_function(self.loss) |
| 44 | + self._set_penalty_type(self.penalty) |
| 45 | + |
| 46 | + self.alpha = float(alpha) |
| 47 | + if self.alpha < 0.0: |
| 48 | + raise ValueError("alpha must be non-negative")
| 49 | + self.rho = float(rho) |
| 50 | + if self.rho < 0.0 or self.rho > 1.0: |
| 51 | + raise ValueError("rho must be in [0, 1]") |
| 52 | + self.fit_intercept = bool(fit_intercept) |
| 53 | + self.n_iter = int(n_iter) |
| 54 | + if self.n_iter <= 0: |
| 55 | + raise ValueError("n_iter must be greater than zero") |
| 56 | + if not isinstance(shuffle, bool): |
| 57 | + raise ValueError("shuffle must be either True or False") |
| 58 | + self.shuffle = bool(shuffle) |
| 59 | + self.seed = seed |
| 60 | + self.verbose = int(verbose) |
| 61 | + |
| 62 | + self.learning_rate = str(learning_rate) |
| 63 | + self._set_learning_rate(self.learning_rate) |
| 64 | + self.eta0 = float(eta0) |
| 65 | + self.power_t = float(power_t) |
| 66 | + if self.learning_rate != "optimal": |
| 67 | + if eta0 <= 0.0: |
| 68 | + raise ValueError("eta0 must be greater than 0.0") |
| 69 | + self.coef_ = None |
| 70 | + self.warm_start = warm_start |
| 71 | + |
| 72 | + self._init_t() |
| 73 | + |
| 74 | + @abstractmethod |
| 75 | + def fit(self, X, y): |
| 76 | + """Fit model.""" |
| 77 | + |
| 78 | + @abstractmethod |
| 79 | + def predict(self, X): |
| 80 | + """Predict using model.""" |
| 81 | + |
| 82 | + def _init_t(self): |
| 83 | + self.t_ = 1.0 |
| 84 | + if self.learning_rate == "optimal": |
| 85 | + typw = np.sqrt(1.0 / np.sqrt(self.alpha)) |
| 86 | + # computing eta0, the initial learning rate |
| 87 | + eta0 = typw / max(1.0, self.loss_function.dloss(-typw, 1.0)) |
| 88 | + # initialize t such that eta at first example equals eta0 |
| 89 | + self.t_ = 1.0 / (eta0 * self.alpha) |
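| | + # (with the "optimal" schedule eta(t) = 1.0 / (alpha * t), as in
| | + # Leon Bottou's sgd project, this choice of t_ makes the step size
| | + # of the very first update equal to eta0)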
| 90 | + |
| 91 | + def _set_learning_rate(self, learning_rate): |
| 92 | + learning_rate_codes = {"constant": 1, "optimal": 2, "invscaling": 3} |
| 93 | + try: |
| 94 | + self.learning_rate_code = learning_rate_codes[learning_rate] |
| 95 | + except KeyError: |
| 96 | + raise ValueError("learning rate %s "
| 97 | + "is not supported." % learning_rate)
| 98 | + |
| 99 | + def _set_loss_function(self, loss): |
| 100 | + """Get concrete LossFunction""" |
| 101 | + raise NotImplementedError("BaseSGD is an abstract class.") |
| 102 | + |
| 103 | + def _set_penalty_type(self, penalty): |
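| | + # map penalty names to the integer codes consumed by the Cython
| | + # plain_sgd routine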
| 104 | + penalty_types = {"none": 0, "l2": 2, "l1": 1, "elasticnet": 3} |
| 105 | + try: |
| 106 | + self.penalty_type = penalty_types[penalty] |
| 107 | + except KeyError: |
| 108 | + raise ValueError("Penalty %s is not supported." % penalty)
| 109 | + |
| 110 | + def _validate_sample_weight(self, sample_weight, n_samples): |
| 111 | + """Set the sample weight array.""" |
| 112 | + if sample_weight is None:
| 113 | + # uniform sample weights |
| 114 | + sample_weight = np.ones(n_samples, dtype=np.float64, order='C') |
| 115 | + else: |
| 116 | + # user-provided array |
| 117 | + sample_weight = np.asarray(sample_weight, dtype=np.float64, |
| 118 | + order="C") |
| 119 | + if sample_weight.shape[0] != n_samples: |
| 120 | + raise ValueError("Shapes of X and sample_weight do not match.") |
| 121 | + return sample_weight |
| 122 | + |
| 123 | + def _set_coef(self, coef_): |
| 124 | + """Make sure that coef_ is fortran-style and 2d. |
| 125 | +
| 126 | + Fortran-style memory layout is needed to ensure that computing |
| 127 | + the dot product between input ``X`` and ``coef_`` does not trigger |
| 128 | + a memory copy. |
| 129 | + """ |
| 130 | + self.coef_ = np.asfortranarray(array2d(coef_)) |
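| | + # coef_.T is then C-contiguous, so np.dot(X, coef_.T) can be
| | + # dispatched to BLAS without copying either operand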
| 131 | + |
| 132 | + def _allocate_parameter_mem(self, n_classes, n_features, coef_init=None, |
| 133 | + intercept_init=None): |
| 134 | + """Allocate mem for parameters; initialize if provided.""" |
| 135 | + if n_classes > 2: |
| 136 | + # allocate coef_ for multi-class |
| 137 | + if coef_init is not None: |
| 138 | + coef_init = np.asarray(coef_init, order="C") |
| 139 | + if coef_init.shape != (n_classes, n_features): |
| 140 | + raise ValueError("Provided coef_init does not match dataset.")
| 141 | + self.coef_ = coef_init |
| 142 | + else: |
| 143 | + self.coef_ = np.zeros((n_classes, n_features), |
| 144 | + dtype=np.float64, order="C") |
| 145 | + |
| 146 | + # allocate intercept_ for multi-class |
| 147 | + if intercept_init is not None: |
| 148 | + intercept_init = np.asarray(intercept_init, order="C") |
| 149 | + if intercept_init.shape != (n_classes, ): |
| 150 | + raise ValueError("Provided intercept_init "
| 151 | + "does not match dataset.")
| 152 | + self.intercept_ = intercept_init |
| 153 | + else: |
| 154 | + self.intercept_ = np.zeros(n_classes, dtype=np.float64, |
| 155 | + order="C") |
| 156 | + else: |
| 157 | + # allocate coef_ for binary problem |
| 158 | + if coef_init is not None: |
| 159 | + coef_init = np.asarray(coef_init, dtype=np.float64, |
| 160 | + order="C") |
| 161 | + coef_init = coef_init.ravel() |
| 162 | + if coef_init.shape != (n_features,): |
| 163 | + raise ValueError("Provided coef_init does not "
| 164 | + "match dataset.")
| 165 | + self.coef_ = coef_init |
| 166 | + else: |
| 167 | + self.coef_ = np.zeros(n_features, dtype=np.float64, order="C") |
| 168 | + |
| 169 | + # allocate intercept_ for binary problem |
| 170 | + if intercept_init is not None: |
| 171 | + intercept_init = np.asarray(intercept_init, dtype=np.float64) |
| 172 | + if intercept_init.shape != (1,) and intercept_init.shape != (): |
| 173 | + raise ValueError("Provided intercept_init "
| 174 | + "does not match dataset.")
| 175 | + self.intercept_ = intercept_init.reshape(1,) |
| 176 | + else: |
| 177 | + self.intercept_ = np.zeros(1, dtype=np.float64, order="C") |
| 178 | + |
| 179 | + def _check_fit_data(self, X, y): |
| 180 | + n_samples, _ = X.shape |
| 181 | + if n_samples != y.shape[0]: |
| 182 | + raise ValueError("Shapes of X and y do not match.") |
| 183 | + |
| 184 | + |
32 | 185 | def _make_dataset(X, y_i, sample_weight): |
33 | 186 | """Returns Dataset object + intercept_decay""" |
34 | 187 | if sp.issparse(X): |
|