scikit-learn
diff --git a/sklearn/linear_model/logistic.py b/sklearn/linear_model/logistic.py
Lines changed: 14 additions & 16 deletions
diff --git a/sklearn/linear_model/tests/test_logistic.py b/sklearn/linear_model/tests/test_logistic.py
Lines changed: 49 additions & 5 deletions
@@ -550,12 +550,12 @@ def logistic_regression_path(X, y, pos_class=None, Cs=10, fit_intercept=True,
         pos_class = classes[1]
 
     # If class_weights is a dict (provided by the user), the weights
-    # are assigned to the original labels. If it is "auto", then
+    # are assigned to the original labels. If it is "balanced", then
     # the class_weights are assigned after masking the labels with a OvR.
     sample_weight = np.ones(X.shape[0])
     le = LabelEncoder()
 
-    if isinstance(class_weight, dict):
+    if isinstance(class_weight, dict) or multi_class == 'multinomial':
         if solver == "liblinear":
             if classes.size == 2:
                 # Reconstruct the weights with keys 1 and -1
@@ -567,7 +567,7 @@ def logistic_regression_path(X, y, pos_class=None, Cs=10, fit_intercept=True,
                                  "solver cannot handle multiclass with "
                                  "class_weight of type dict. Use the lbfgs, "
                                  "newton-cg solvers or set "
-                                 "class_weight='auto'")
+                                 "class_weight='balanced'")
         else:
             class_weight_ = compute_class_weight(class_weight, classes, y)
             sample_weight = class_weight_[le.fit_transform(y)]
@@ -576,13 +576,16 @@ def logistic_regression_path(X, y, pos_class=None, Cs=10, fit_intercept=True,
     # multinomial case this is not necessary.
     if multi_class == 'ovr':
         w0 = np.zeros(n_features + int(fit_intercept))
-        mask_classes = [-1, 1]
+        mask_classes = np.array([-1, 1])
         mask = (y == pos_class)
-        y[mask] = 1
-        y[~mask] = -1
-        # To take care of object dtypes, i.e 1 and -1 are in the form of
-        # strings.
-        y = as_float_array(y, copy=False)
+        y_bin = np.ones(y.shape, dtype=np.float64)
+        y_bin[~mask] = -1.
+        # "auto"/"balanced" weights are computed from the binarized y_bin
+
+        if class_weight in ("auto", "balanced"):
+            class_weight_ = compute_class_weight(class_weight, mask_classes,
+                                                 y_bin)
+            sample_weight = class_weight_[le.fit_transform(y_bin)]
 
     else:
         lbin = LabelBinarizer()
@@ -591,11 +594,6 @@ def logistic_regression_path(X, y, pos_class=None, Cs=10, fit_intercept=True,
             Y_bin = np.hstack([1 - Y_bin, Y_bin])
         w0 = np.zeros((Y_bin.shape[1], n_features + int(fit_intercept)),
                       order='F')
-        mask_classes = classes
-
-    if class_weight == "auto":
-        class_weight_ = compute_class_weight(class_weight, mask_classes, y)
-        sample_weight = class_weight_[le.fit_transform(y)]
 
     if coef is not None:
         # it must work both giving the bias term and not
@@ -632,7 +630,7 @@ def logistic_regression_path(X, y, pos_class=None, Cs=10, fit_intercept=True,
             grad = lambda x, *args: _multinomial_loss_grad(x, *args)[1]
             hess = _multinomial_grad_hess
     else:
-        target = y
+        target = y_bin
         if solver == 'lbfgs':
             func = _logistic_loss_and_grad
         elif solver == 'newton-cg':
@@ -664,7 +662,7 @@ def logistic_regression_path(X, y, pos_class=None, Cs=10, fit_intercept=True,
                            tol=tol)
         elif solver == 'liblinear':
             coef_, intercept_, _, = _fit_liblinear(
-                X, y, C, fit_intercept, intercept_scaling, class_weight,
+                X, target, C, fit_intercept, intercept_scaling, class_weight,
                 penalty, dual, verbose, max_iter, tol, random_state)
             if fit_intercept:
                 w0 = np.concatenate([coef_.ravel(), intercept_])
 
@@ -14,6 +14,7 @@
 from sklearn.utils.testing import ignore_warnings
 from sklearn.utils.testing import assert_raise_message
 from sklearn.utils import ConvergenceWarning
+from sklearn.utils import compute_class_weight
 
 from sklearn.linear_model.logistic import (
     LogisticRegression,
@@ -25,7 +26,6 @@
 from sklearn.datasets import load_iris, make_classification
 from sklearn.metrics import log_loss
 
-
 X = [[-1, 0], [0, 1], [1, 1]]
 X_sp = sp.csr_matrix(X)
 Y1 = [0, 1, 1]
@@ -518,12 +518,12 @@ def test_logistic_regressioncv_class_weights():
     X, y = make_classification(n_samples=20, n_features=20, n_informative=10,
                                n_classes=3, random_state=0)
 
-    # Test the liblinear fails when class_weight of type dict is
-    # provided, when it is multiclass. However it can handle
-    # binary problems.
+    msg = ("In LogisticRegressionCV the liblinear solver cannot handle "
+           "multiclass with class_weight of type dict. Use the lbfgs, "
+           "newton-cg solvers or set class_weight='balanced'")
     clf_lib = LogisticRegressionCV(class_weight={0: 0.1, 1: 0.2},
                                    solver='liblinear')
-    assert_raises(ValueError, clf_lib.fit, X, y)
+    assert_raise_message(ValueError, msg, clf_lib.fit, X, y)
     y_ = y.copy()
     y_[y == 2] = 1
     clf_lib.fit(X, y_)
@@ -541,6 +541,50 @@ def test_logistic_regressioncv_class_weights():
     assert_array_almost_equal(clf_lib.coef_, clf_lbf.coef_, decimal=4)
 
 
+def _compute_class_weight_dictionary(y):
+    """Return the "balanced" class weights of ``y`` as a dictionary.
+
+    Each key is a distinct label found in ``y``; each value is the weight
+    that ``compute_class_weight("balanced", ...)`` returns for that label.
+    """
+    labels = np.unique(y)
+    weights = compute_class_weight("balanced", labels, y)
+    # Pair every label with the weight found at the same position.
+    return dict(zip(labels, weights))
+
+
+def test_logistic_regression_class_weights():
+    # class_weight="balanced" and the equivalent explicit dictionary of
+    # weights are fitted side by side and must give the same coefficients.
+    scenarios = (
+        # Multinomial case: remove 90% of class 0
+        (slice(45, None), "multinomial", ("lbfgs", "newton-cg")),
+        # Binary case: remove 90% of class 0 and 100% of class 2
+        (slice(45, 100), "ovr", ("lbfgs", "newton-cg", "liblinear")),
+    )
+
+    for rows, multi_class, solvers in scenarios:
+        X = iris.data[rows, :]
+        y = iris.target[rows]
+        explicit_weights = _compute_class_weight_dictionary(y)
+
+        for solver in solvers:
+            clf_balanced = LogisticRegression(
+                solver=solver, multi_class=multi_class,
+                class_weight="balanced")
+            clf_explicit = LogisticRegression(
+                solver=solver, multi_class=multi_class,
+                class_weight=explicit_weights)
+
+            # Both estimators see exactly the same training data.
+            clf_balanced.fit(X, y)
+            clf_explicit.fit(X, y)
+
+            assert_array_almost_equal(clf_balanced.coef_,
+                                      clf_explicit.coef_,
+                                      decimal=6)
+
+
 def test_logistic_regression_convergence_warnings():
     # Test that warnings are raised if model does not converge