82 spe #83

Merged (4 commits, Jul 9, 2021)
@@ -35,7 +35,7 @@ def RMSPEMetric(XGBoost=False):
     Calculates the Root Mean Squared Percentage Error:
     https://www.kaggle.com/c/optiver-realized-volatility-prediction/overview/evaluation

-    There is no loss function for this as the gradient is constant, meaning the Hessian is equal to 0.
+    The corresponding loss function is Squared Percentage Error.
     Args:
         XGBoost (Bool): Set to True if using XGBoost. We assume LightGBM as default use.
             Note that you should also set `maximize=False` in the XGBoost train function.
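For reference, the metric documented here is RMSPE = sqrt(mean(((y - yhat) / y)^2)), per the linked Kaggle page. Below is a minimal sketch of an eval-metric factory with the same contract. It is hypothetical code, not the library's actual implementation; it only assumes LightGBM's `(name, value, is_higher_better)` and XGBoost's `(name, value)` return conventions for custom metrics:

```python
import numpy as np

def rmspe_metric_sketch(XGBoost=False):
    """Hypothetical RMSPE eval-metric factory mirroring the documented interface."""

    def rmspe(yhat, dtrain):
        y = dtrain.get_label()
        value = np.sqrt(np.mean(((y - yhat) / y) ** 2))
        if XGBoost:
            # XGBoost custom metrics return (name, value);
            # pair with maximize=False in xgb.train, as the docstring notes.
            return "RMSPE", value
        # LightGBM custom metrics return (name, value, is_higher_better).
        return "RMSPE", value, False

    return rmspe
```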
4 changes: 3 additions & 1 deletion bokbokbok/loss_functions/regression/__init__.py
@@ -3,8 +3,10 @@

 from .regression_loss_functions import (
     LogCoshLoss,
+    SPELoss,
 )

 __all__ = [
-    "LogCoshLoss"
+    "LogCoshLoss",
+    "SPELoss",
 ]
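After this change the new loss is importable from the package namespace, matching the tutorial further down:

```python
from bokbokbok.loss_functions.regression import LogCoshLoss, SPELoss
```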
53 changes: 53 additions & 0 deletions bokbokbok/loss_functions/regression/regression_loss_functions.py
@@ -56,3 +56,56 @@ def log_cosh_loss(
         return grad, hess

     return log_cosh_loss
+
+
+def SPELoss():
+    """
+    Squared Percentage Error loss.
+    """
+
+    def _gradient(yhat, dtrain):
+        """
+        Compute the gradient of squared percentage error.
+        Args:
+            yhat (np.array): Predictions
+            dtrain: The XGBoost / LightGBM dataset
+
+        Returns:
+            SPE Gradient
+        """
+        y = dtrain.get_label()
+        return -2 * (y - yhat) / (y ** 2)
+
+    def _hessian(yhat, dtrain):
+        """
+        Compute the Hessian for squared percentage error.
+        Args:
+            yhat (np.array): Predictions
+            dtrain: The XGBoost / LightGBM dataset
+
+        Returns:
+            SPE Hessian
+        """
+        y = dtrain.get_label()
+        return 2 / (y ** 2)
+
+    def squared_percentage(yhat, dtrain):
+        """
+        Calculate gradient and Hessian for squared percentage error.
+
+        Args:
+            yhat (np.array): Predictions
+            dtrain: The XGBoost / LightGBM dataset
+
+        Returns:
+            grad: SPE loss gradient
+            hess: SPE loss Hessian
+        """
+        yhat[yhat < -1] = -1 + 1e-6  # floor predictions below -1 at -1 + 1e-6
+        grad = _gradient(yhat, dtrain)
+
+        hess = _hessian(yhat, dtrain)
+
+        return grad, hess
+
+    return squared_percentage
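The gradient and Hessian implemented above follow from differentiating the per-sample squared percentage error with respect to the prediction:

```latex
L(y, \hat{y}) = \left(\frac{y - \hat{y}}{y}\right)^{2}, \qquad
\frac{\partial L}{\partial \hat{y}} = \frac{-2\,(y - \hat{y})}{y^{2}}, \qquad
\frac{\partial^{2} L}{\partial \hat{y}^{2}} = \frac{2}{y^{2}}.
```

Note that the Hessian depends only on the label, not on the prediction, so each sample contributes a constant second-order weight 2/y^2 to the boosting step.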
9 changes: 5 additions & 4 deletions docs/tutorials/RMSPE.ipynb
@@ -21,6 +21,7 @@
 "from sklearn.model_selection import train_test_split\n",
 "from sklearn.metrics import mean_absolute_error\n",
 "from bokbokbok.eval_metrics.regression import RMSPEMetric\n",
+"from bokbokbok.loss_functions.regression import SPELoss\n",
 "\n",
 "X, y = make_regression(n_samples=1000, \n",
 "                       n_features=10, \n",
@@ -56,16 +57,15 @@
 "          'num_leaves': 10,\n",
 "          'learning_rate': 0.1,\n",
 "          'verbose': 10,\n",
-"          #'objective': 'RMSE',\n",
 "         }\n",
 "\n",
 "clf = lgb.train(params=params,\n",
 "                train_set=train,\n",
 "                valid_sets=[train, valid],\n",
 "                valid_names=['train','valid'],\n",
+"                fobj=SPELoss(),\n",
 "                feval=RMSPEMetric(),\n",
-"                early_stopping_rounds=3000,\n",
-"                verbose_eval=1)\n",
+"                early_stopping_rounds=3000)\n",
 "\n",
 "mean_absolute_error(y_valid, clf.predict(X_valid))"
@@ -99,6 +99,7 @@
 "                num_boost_round=3000,\n",
 "                early_stopping_rounds=100,\n",
 "                verbose_eval=100,\n",
+"                obj=LogCoshLoss(),\n",
 "                maximize=False,\n",
 "                feval=RMSPEMetric(XGBoost=True),\n",
 "                evals=[(dtrain, 'dtrain'), (dvalid, 'dvalid')])\n",
@@ -128,4 +129,4 @@
 },
 "nbformat": 4,
 "nbformat_minor": 4
-}
+}
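As a quick sanity check on the analytic gradient in SPELoss, one can compare it against central finite differences. This is a standalone sketch; the small `_Data` wrapper standing in for `dtrain.get_label()` is hypothetical, and `_gradient` replicates the inner function from the diff above:

```python
import numpy as np

class _Data:
    """Hypothetical stand-in for an XGBoost DMatrix / LightGBM Dataset."""
    def __init__(self, y):
        self._y = y
    def get_label(self):
        return self._y

def _gradient(yhat, dtrain):
    # Same formula as the _gradient inner function in SPELoss.
    y = dtrain.get_label()
    return -2 * (y - yhat) / (y ** 2)

def spe(yhat, y):
    # Per-sample squared percentage error.
    return ((y - yhat) / y) ** 2

rng = np.random.default_rng(0)
y = rng.uniform(1.0, 5.0, size=100)       # keep labels away from zero
yhat = y + rng.normal(scale=0.1, size=100)

eps = 1e-6
numeric = (spe(yhat + eps, y) - spe(yhat - eps, y)) / (2 * eps)
analytic = _gradient(yhat, _Data(y))
assert np.allclose(numeric, analytic, atol=1e-5)
```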