2017-11-18 11:34:07 +08:00
|
|
|
import numpy as np
|
2017-08-19 13:23:00 +08:00
|
|
|
|
|
|
|
""" Here I implemented the scoring functions.
|
|
|
|
MAE, MSE, RMSE, RMSLE and MBD are included.
|
|
|
|
|
|
|
|
Those are used for calculating differences between
|
|
|
|
predicted values and actual values.
|
|
|
|
|
|
|
|
Metrics are slightly differentiated. Sometimes squared, rooted,
|
|
|
|
even log is used.
|
|
|
|
|
|
|
|
Using log and roots can be perceived as tools for penalizing big
|
|
|
|
errors. However, choosing an appropriate metric depends on the situation
|
|
|
|
and the type of data.
|
|
|
|
"""
|
|
|
|
|
2019-10-05 13:14:13 +08:00
|
|
|
# Mean Absolute Error
|
2017-08-19 13:23:00 +08:00
|
|
|
def mae(predict, actual):
    """Return the mean absolute error between predictions and targets.

    Both inputs are converted to floating-point arrays before they are
    subtracted. Without that conversion, unsigned integer inputs wrap
    around on subtraction (e.g. uint8 ``1 - 2`` becomes ``255``) and
    boolean inputs raise, because NumPy subtracts in the input dtype.

    Args:
        predict: Array-like of predicted values.
        actual: Array-like of observed values, combined element-wise with
            ``predict`` (NumPy broadcasting rules apply).

    Returns:
        The mean of ``|predict - actual|`` as a NumPy float. Empty input
        yields ``nan``.
    """
    predict = np.asarray(predict, dtype=float)
    actual = np.asarray(actual, dtype=float)

    return np.abs(predict - actual).mean()
|
|
|
|
|
2019-10-05 13:14:13 +08:00
|
|
|
|
|
|
|
# Mean Squared Error
|
2017-08-19 13:23:00 +08:00
|
|
|
def mse(predict, actual):
    """Return the mean squared error between predictions and targets.

    Both inputs are converted to floating-point arrays first. Squaring in
    a narrow integer dtype overflows silently (int8 ``100 ** 2`` becomes
    ``16``) and unsigned subtraction wraps around, so the arithmetic is
    done in float instead of the input dtype.

    Args:
        predict: Array-like of predicted values.
        actual: Array-like of observed values, combined element-wise with
            ``predict`` (NumPy broadcasting rules apply).

    Returns:
        The mean of ``(predict - actual) ** 2`` as a NumPy float. Empty
        input yields ``nan``.
    """
    predict = np.asarray(predict, dtype=float)
    actual = np.asarray(actual, dtype=float)

    return np.square(predict - actual).mean()
|
|
|
|
|
2019-10-05 13:14:13 +08:00
|
|
|
|
|
|
|
# Root Mean Squared Error
|
2017-08-19 13:23:00 +08:00
|
|
|
def rmse(predict, actual):
    """Return the root mean squared error between predictions and targets.

    Both inputs are converted to floating-point arrays first, so that
    squaring cannot overflow a narrow integer dtype and unsigned
    subtraction cannot wrap around.

    Args:
        predict: Array-like of predicted values.
        actual: Array-like of observed values, combined element-wise with
            ``predict`` (NumPy broadcasting rules apply).

    Returns:
        ``sqrt(mean((predict - actual) ** 2))`` as a NumPy float. Empty
        input yields ``nan``.
    """
    predict = np.asarray(predict, dtype=float)
    actual = np.asarray(actual, dtype=float)

    mean_squared_error = np.square(predict - actual).mean()
    return np.sqrt(mean_squared_error)
|
|
|
|
|
2019-10-05 13:14:13 +08:00
|
|
|
|
|
|
|
# Root Mean Square Logarithmic Error
|
2017-08-19 13:23:00 +08:00
|
|
|
def rmsle(predict, actual):
    """Return the root mean squared logarithmic error.

    The error is the RMSE of ``log(1 + predict)`` against
    ``log(1 + actual)``. Inputs are converted to floating-point arrays
    first: adding 1 in an unsigned integer dtype wraps at the type's
    maximum (uint8 ``255 + 1`` becomes ``0``), which turned the logarithm
    into ``-inf``. ``np.log1p`` is used instead of ``np.log(x + 1)`` so
    values close to zero keep their precision.

    Args:
        predict: Array-like of predicted values.
        actual: Array-like of observed values, combined element-wise with
            ``predict`` (NumPy broadcasting rules apply).

    Returns:
        The RMSLE as a NumPy float. Values at or below -1 have no finite
        ``log(1 + x)``, so they propagate ``nan``/``inf`` into the result
        rather than raising.
    """
    predict = np.asarray(predict, dtype=float)
    actual = np.asarray(actual, dtype=float)

    log_difference = np.log1p(predict) - np.log1p(actual)
    mean_squared_log_error = np.square(log_difference).mean()

    return np.sqrt(mean_squared_log_error)
|
2017-11-18 11:34:07 +08:00
|
|
|
|
2019-10-05 13:14:13 +08:00
|
|
|
|
|
|
|
# Mean Bias Deviation
|
2017-11-18 11:34:07 +08:00
|
|
|
def mbd(predict, actual):
    """Return the mean bias deviation as a percentage of the mean target.

    Computed as ``mean(predict - actual) / mean(actual) * 100``. A
    positive score means the predictions are too high on average, a
    negative score that they are too low.

    Inputs are converted to floating-point arrays first so unsigned
    integer subtraction cannot wrap around. The means are taken directly
    rather than dividing sums by ``len(predict)``, which failed for scalar
    input and mis-scaled the ratio when only one argument was broadcast.
    The function no longer prints intermediate values to stdout.

    Args:
        predict: Array-like of predicted values.
        actual: Array-like of observed values, combined element-wise with
            ``predict`` (NumPy broadcasting rules apply).

    Returns:
        The bias percentage as a NumPy float. When the mean of ``actual``
        is zero the result is ``inf`` or ``nan`` (NumPy division
        semantics) rather than an exception.
    """
    predict = np.asarray(predict, dtype=float)
    actual = np.asarray(actual, dtype=float)

    mean_bias = (predict - actual).mean()
    mean_actual = actual.mean()

    return mean_bias / mean_actual * 100
|