Fix bugs in robust module and improve test coverage (#78) · rth/scikit-learn-extra@5b45d64 · GitHub


Commit 5b45d64

TimotheeMathieu and rth authored
Fix bugs in robust module and improve test coverage (scikit-learn-contrib#78)
* Creation of one class for each task: classification, regression and clustering. Update docs, tests, examples. Fix typo
* Update plot clustering
* Update test_common
* Fix tests and cross_val
* Fix doc of function RobustWeightedEstimators
* Fix _RobustWeightedEstimator doc and RobustWeightedKMeans doc
* Black reformatted
* Add Huber loss
* Reformat with black
* Changes suggested by @rth in PR
* Add stop criterion and change for faster examples
* Subsample clustering
* Fix clustering example
* Cython kmeans loss
* Fix black
* Type conversion in Cython
* Fix setup.py on Windows
* Fix black
* Add losses and fix docstrings
* Black and clean up prints
* Fix mistake in code
* Fix diverse small problems. Better test coverage
* Black
* Black and flake8
* Fix base estimator fitted error
* Fix test_common
* Add test for weights_
* Add more tests
* Add assert almost equal
* Add test vs HuberRegressor
* Flake8
* Fix verbose
* Fix API doc and add n_iter_no_change as a parameter in robust
* Update sklearn_extra/robust/robust_weighted_estimator.py
* Fix black
* Fix import error
* Change test kmedoids
* Revert commit 6ecdc1b
* Update sklearn_extra/robust/mean_estimators.py

Co-authored-by: Roman Yurchak <rth.yurchak@gmail.com>
1 parent 44ac430 commit 5b45d64
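The headline change splits the single robust estimator into one public class per task (regression, classification, clustering). Below is a minimal usage sketch, not part of the commit: it assumes RobustWeightedRegressor and RobustWeightedKMeans are importable from sklearn_extra.robust and that the KMeans variant accepts the same weighting/eta0 arguments; the regressor parameters mirror the example diff further down, while the toy data and n_clusters value are purely illustrative.

import numpy as np
from sklearn_extra.robust import RobustWeightedRegressor, RobustWeightedKMeans

rng = np.random.RandomState(42)
X = rng.normal(size=(200, 2))
y = X @ np.array([1.0, 2.0]) + rng.normal(scale=0.1, size=200)

# Regression: parameters taken from the updated California-houses example below.
reg = RobustWeightedRegressor(
    weighting="huber",
    c=0.1,
    eta0=1e-2,
    sgd_args={"learning_rate": "invscaling"},
)
reg.fit(X, y)

# Clustering: n_clusters is an assumed illustrative value.
km = RobustWeightedKMeans(n_clusters=2, weighting="huber", eta0=1e-2)
km.fit(X)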

5 files changed: +599 -110 lines

examples/robust/plot_robust_regression_california_houses.py

Lines changed: 3 additions & 4 deletions
@@ -54,11 +54,10 @@ def quadratic_loss(est, X, y, X_test, y_test):
         "RobustWeightedRegressor",
         RobustWeightedRegressor(
             weighting="huber",
-            c=0.01,
+            c=0.1,
             eta0=1e-2,
             sgd_args={
-                "learning_rate": "adaptive",
-                "eta0": 1e-3,
+                "learning_rate": "invscaling",
             },
         ),
     ),
@@ -89,7 +88,7 @@ def quadratic_loss(est, X, y, X_test, y_test):
         res[i, f, 0] = np.mean(cv)
         res[i, f, 1] = np.median(cv)

-fig, (axe1, axe2) = plt.subplots(1, 2)
+fig, (axe1, axe2) = plt.subplots(2, 1)
 names = [name for name, est in estimators]

 axe1.boxplot(res[:, :, 0].T, labels=names)
sklearn_extra/robust/_robust_weighted_estimator_helper.pyx

Lines changed: 260 additions & 0 deletions
@@ -10,6 +10,14 @@ cimport numpy as np
 from sklearn.utils.extmath import row_norms
 from cython cimport floating

+import sys
+from time import time
+
+from libc.math cimport exp, log, sqrt, pow, fabs
+cimport numpy as np
+from numpy.math cimport INFINITY
+
+
 # Modified from sklearn.cluster._k_means_fast.pyx
 np.import_array()

@@ -73,3 +81,255 @@ cpdef np.ndarray[floating] _kmeans_loss(np.ndarray[floating, ndim=2, mode='c'] X
         j = labels[i]
         inertias[i] = _euclidean_dense_dense(&X[i, 0], &centers[j, 0], n_features)
     return inertias
+
+
+# Regression and Classification losses, from scikit-learn.
+
+# ----------------------------------------
+# Extension Types for Loss Functions
+# ----------------------------------------
+
+cdef class LossFunction:
+    """Base class for convex loss functions"""
+
+    cdef double loss(self, double p, double y) nogil:
+        """Evaluate the loss function.
+
+        Parameters
+        ----------
+        p : double
+            The prediction, p = w^T x
+        y : double
+            The true value (aka target)
+
+        Returns
+        -------
+        double
+            The loss evaluated at `p` and `y`.
+        """
+        return 0.
+
+    def py_dloss(self, double p, double y):
+        """Python version of `dloss` for testing.
+
+        Pytest needs a python function and can't use cdef functions.
+        """
+        return self.dloss(p, y)
+
+    def py_loss(self, double p, double y):
+        """Python version of `loss` for testing.
+
+        Pytest needs a python function and can't use cdef functions.
+        """
+        return self.loss(p, y)
+
+    cdef double dloss(self, double p, double y) nogil:
+        """Evaluate the derivative of the loss function with respect to
+        the prediction `p`.
+
+        Parameters
+        ----------
+        p : double
+            The prediction, p = w^T x
+        y : double
+            The true value (aka target)
+
+        Returns
+        -------
+        double
+            The derivative of the loss function with respect to `p`.
+        """
+        return 0.
+
+
+cdef class Regression(LossFunction):
+    """Base class for loss functions for regression"""
+
+    cdef double loss(self, double p, double y) nogil:
+        return 0.
+
+    cdef double dloss(self, double p, double y) nogil:
+        return 0.
+
+
+cdef class Classification(LossFunction):
+    """Base class for loss functions for classification"""
+
+    cdef double loss(self, double p, double y) nogil:
+        return 0.
+
+    cdef double dloss(self, double p, double y) nogil:
+        return 0.
+
+
+cdef class ModifiedHuber(Classification):
+    """Modified Huber loss for binary classification with y in {-1, 1}
+
+    This is equivalent to quadratically smoothed SVM with gamma = 2.
+
+    See T. Zhang 'Solving Large Scale Linear Prediction Problems Using
+    Stochastic Gradient Descent', ICML'04.
+    """
+    cdef double loss(self, double p, double y) nogil:
+        cdef double z = p * y
+        if z >= 1.0:
+            return 0.0
+        elif z >= -1.0:
+            return (1.0 - z) * (1.0 - z)
+        else:
+            return -4.0 * z
+
+    cdef double dloss(self, double p, double y) nogil:
+        cdef double z = p * y
+        if z >= 1.0:
+            return 0.0
+        elif z >= -1.0:
+            return 2.0 * (1.0 - z) * -y
+        else:
+            return -4.0 * y
+
+    def __reduce__(self):
+        return ModifiedHuber, ()
+
+
+cdef class Hinge(Classification):
+    """Hinge loss for binary classification tasks with y in {-1, 1}
+
+    Parameters
+    ----------
+    threshold : float > 0.0
+        Margin threshold. When threshold=1.0, one gets the loss used by SVM.
+        When threshold=0.0, one gets the loss used by the Perceptron.
+    """
+
+    cdef double threshold
+
+    def __init__(self, double threshold=1.0):
+        self.threshold = threshold
+
+    cdef double loss(self, double p, double y) nogil:
+        cdef double z = p * y
+        if z <= self.threshold:
+            return self.threshold - z
+        return 0.0
+
+    cdef double dloss(self, double p, double y) nogil:
+        cdef double z = p * y
+        if z <= self.threshold:
+            return -y
+        return 0.0
+
+    def __reduce__(self):
+        return Hinge, (self.threshold,)
+
+
+cdef class SquaredHinge(Classification):
+    """Squared Hinge loss for binary classification tasks with y in {-1, 1}
+
+    Parameters
+    ----------
+    threshold : float > 0.0
+        Margin threshold. When threshold=1.0, one gets the loss used by
+        (quadratically penalized) SVM.
+    """
+
+    cdef double threshold
+
+    def __init__(self, double threshold=1.0):
+        self.threshold = threshold
+
+    cdef double loss(self, double p, double y) nogil:
+        cdef double z = self.threshold - p * y
+        if z > 0:
+            return z * z
+        return 0.0
+
+    cdef double dloss(self, double p, double y) nogil:
+        cdef double z = self.threshold - p * y
+        if z > 0:
+            return -2 * y * z
+        return 0.0
+
+    def __reduce__(self):
+        return SquaredHinge, (self.threshold,)
+
+
+cdef class Log(Classification):
+    """Logistic regression loss for binary classification with y in {-1, 1}"""
+
+    cdef double loss(self, double p, double y) nogil:
+        cdef double z = p * y
+        # approximately equal and saves the computation of the log
+        if z > 18:
+            return exp(-z)
+        if z < -18:
+            return -z
+        return log(1.0 + exp(-z))
+
+    cdef double dloss(self, double p, double y) nogil:
+        cdef double z = p * y
+        # approximately equal and saves the computation of the log
+        if z > 18.0:
+            return exp(-z) * -y
+        if z < -18.0:
+            return -y
+        return -y / (exp(z) + 1.0)
+
+    def __reduce__(self):
+        return Log, ()
+
+
+cdef class SquaredLoss(Regression):
+    """Squared loss traditionally used in linear regression."""
+    cdef double loss(self, double p, double y) nogil:
+        return 0.5 * (p - y) * (p - y)
+
+    cdef double dloss(self, double p, double y) nogil:
+        return p - y
+
+    def __reduce__(self):
+        return SquaredLoss, ()
+
+
+cdef class Huber(Regression):
+    """Huber regression loss
+
+    Variant of the SquaredLoss that is robust to outliers (quadratic near zero,
+    linear for large errors).
+
+    https://en.wikipedia.org/wiki/Huber_Loss_Function
+    """
+
+    cdef double c
+
+    def __init__(self, double c):
+        self.c = c
+
+    cdef double loss(self, double p, double y) nogil:
+        cdef double r = p - y
+        cdef double abs_r = fabs(r)
+        if abs_r <= self.c:
+            return 0.5 * r * r
+        else:
+            return self.c * abs_r - (0.5 * self.c * self.c)
+
+    cdef double dloss(self, double p, double y) nogil:
+        cdef double r = p - y
+        cdef double abs_r = fabs(r)
+        if abs_r <= self.c:
+            return r
+        elif r > 0.0:
+            return self.c
+        else:
+            return -self.c
+
+    def __reduce__(self):
+        return Huber, (self.c,)
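As a quick sanity check of the piecewise definition above, here is a small NumPy sketch (not part of the commit; function names are illustrative) that reproduces Huber.loss and Huber.dloss and could be compared against the py_loss / py_dloss test helpers:

import numpy as np

def huber_loss(p, y, c):
    # Quadratic (0.5 * r**2) for |r| <= c, linear with slope c beyond that.
    r = np.asarray(p, dtype=float) - y
    abs_r = np.abs(r)
    return np.where(abs_r <= c, 0.5 * r ** 2, c * abs_r - 0.5 * c ** 2)

def huber_dloss(p, y, c):
    # Derivative w.r.t. the prediction p: r in the quadratic region, clipped to +/- c outside.
    r = np.asarray(p, dtype=float) - y
    return np.clip(r, -c, c)

print(huber_loss([0.1, 2.0], 0.0, c=0.5))   # [0.005 0.875]
print(huber_dloss([0.1, 2.0], 0.0, c=0.5))  # [0.1 0.5]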

sklearn_extra/robust/mean_estimators.py

Lines changed: 4 additions & 3 deletions
@@ -118,9 +118,10 @@ def huber(X, c=1.35, T=20):

     def psisx(x, c):
         # Huber weight function.
-        res = np.ones(len(x))
-        res[x != 0] = (2 * (x[x != 0] > 0) - 1) * c / x[x != 0]
-        res[np.abs(x) < c] = 1
+        res = np.zeros(len(x))
+        mask = np.abs(x) <= c
+        res[mask] = 1
+        res[~mask] = (c / np.abs(x))[~mask]
         res[~np.isfinite(x)] = 0
         return res
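The rewritten psisx now computes the standard Huber weights directly: weight 1 on the central region |x| <= c, c/|x| in the tails, and 0 for non-finite values. A standalone sketch of the same logic (the function name is illustrative, not from the commit; the division is restricted to the tail region):

import numpy as np

def huber_weights(x, c=1.35):
    x = np.asarray(x, dtype=float)
    res = np.zeros(len(x))
    mask = np.abs(x) <= c                 # central (quadratic) region gets weight 1
    res[mask] = 1
    res[~mask] = c / np.abs(x)[~mask]     # tails are down-weighted as c / |x|
    res[~np.isfinite(x)] = 0              # non-finite observations get zero weight
    return res

print(huber_weights(np.array([0.0, 1.0, 2.7, np.inf])))
# -> [1.   1.   0.5  0. ]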
