Source code for traveltimes_prediction.models.algorithms.linear_regression_wrapper
from sklearn.linear_model import LinearRegression
from sklearn.preprocessing import StandardScaler
import numpy as np
from ..base_model import BaseModel
class LinearRegressionWrapper(LinearRegression, BaseModel):
    """
    Class - wrapper for LinearRegression.

    Features are standardised with a ``StandardScaler`` before they are handed
    to the underlying ``LinearRegression``. The fitted state can be exported to
    a plain dict with :meth:`dump` and rebuilt with :meth:`load`.
    """

    name = 'LinearRegression'

    def __init__(self, **kwargs):
        """
        Constructor.

        :param dict kwargs: keyword arguments forwarded unchanged to the parent constructor(s).
        """
        super().__init__(**kwargs)
        # Scaler is fitted in `fit` and reused for every `predict` call.
        self.scaler = StandardScaler()

    def fit(self, X, y, sample_weight=None):
        """
        Method for fitting of the estimator.

        Fits the scaler on ``X``, records two statistics of ``y`` and then fits
        the linear regression on the scaled features.

        :param numpy.ndarray X: training feature matrix.
        :param numpy.ndarray y: training target values.
        :param numpy.ndarray sample_weight: optional per-sample weights, passed through to ``LinearRegression.fit``.
        :return: the fitted instance (``self``).
        """
        # Helper is not defined in this class.
        # NOTE(review): presumably inherited from BaseModel and responsible for
        # computing `_median_imputer` - confirm.
        self._get_descriptors(X)

        self.scaler.fit(X)
        X = self.scaler.transform(X)

        # 10th percentile of the targets and 1.5x their maximum.
        # NOTE(review): presumably the bounds used by `_coerce` to limit
        # predictions - confirm against BaseModel.
        self.min_y_train = np.percentile(y, 10)
        self.max_y_train = 1.5 * max(y)

        super().fit(X, y, sample_weight)
        return self

    def predict(self, X):
        """
        Method for the prediction of the output values given the feature vector.

        :param numpy.ndarray X: feature matrix to predict for.
        :return: the regression output after it has been passed through ``self._coerce``.
        """
        # NOTE(review): imputation helper is defined outside this class
        # (presumably BaseModel) - confirm what it fills in.
        X = self._impute_prediction_sample(X=X)
        # Apply the same scaling that was learned in `fit`.
        X = self.scaler.transform(X)
        pred = super().predict(X=X)
        return self._coerce(pred)

    def dump(self):
        """
        Method for dumping of the existing model.

        Array-valued attributes are converted to lists via ``tolist()``.

        :return: dict with the keys ``'model'`` (fitted parameters, including the
            nested ``'scaler'`` state) and ``'model_type'`` (the class ``name``).
        """
        scaler = self.scaler
        return {
            'model': {
                'coef_': self.coef_.tolist(),
                'intercept_': self.intercept_.tolist(),
                'min_y_train': self.min_y_train,
                'max_y_train': self.max_y_train,
                'scaler': {
                    'scale_': scaler.scale_.tolist(),
                    'mean_': scaler.mean_.tolist(),
                    'var_': scaler.var_.tolist(),
                    'n_samples_seen_': scaler.n_samples_seen_,
                },
                '_median_imputer': self._median_imputer.tolist(),
            },
            'model_type': self.name,
        }

    @staticmethod
    def load(model):
        """
        Method for recreating model from dumped data.

        :param dict model: the mapping stored under the ``'model'`` key of the
            dict produced by :meth:`dump` (not the whole dump - the keys
            ``'coef_'``, ``'scaler'`` etc. are read from it directly).
        :return: LinearRegressionWrapper
        """
        inst = LinearRegressionWrapper()
        inst.coef_ = np.array(model['coef_'])
        inst.intercept_ = np.array(model['intercept_'])
        inst.min_y_train = model['min_y_train']
        inst.max_y_train = model['max_y_train']

        scaler_state = model['scaler']
        inst.scaler.scale_ = np.array(scaler_state['scale_'])
        inst.scaler.mean_ = np.array(scaler_state['mean_'])
        inst.scaler.var_ = np.array(scaler_state['var_'])
        # Must be `n_samples_seen_` (the attribute `dump` reads); the previous
        # misspelling left it unset, so dumping a loaded model failed.
        inst.scaler.n_samples_seen_ = scaler_state['n_samples_seen_']

        inst._median_imputer = np.array(model['_median_imputer'])
        return inst