Repository URL to install this package:
|
Version:
1.0.0 ▾
|
regression-model
/
pipeline.py
|
|---|
from sklearn.linear_model import Lasso
from sklearn.pipeline import Pipeline
from sklearn.preprocessing import MinMaxScaler
from regression_model.processing import preprocessors as pp
from regression_model.processing import features
from regression_model.config import config
import logging
_logger = logging.getLogger(__name__)
price_pipe = Pipeline(
[
('categorical_imputer',
pp.CategoricalImputer(variables=config.CATEGORICAL_VARS_WITH_NA)),
('numerical_inputer',
pp.NumericalImputer(variables=config.NUMERICAL_VARS_WITH_NA)),
('temporal_variable',
pp.TemporalVariableEstimator(
variables=config.TEMPORAL_VARS,
reference_variable=config.DROP_FEATURES)),
('rare_label_encoder',
pp.RareLabelCategoricalEncoder(
tol=0.01,
variables=config.CATEGORICAL_VARS)),
('categorical_encoder',
pp.CategoricalEncoder(variables=config.CATEGORICAL_VARS)),
('log_transformer',
features.LogTransformer(variables=config.NUMERICALS_LOG_VARS)),
('drop_features',
pp.DropUnecessaryFeatures(variables_to_drop=config.DROP_FEATURES)),
('scaler', MinMaxScaler()),
('Linear_model', Lasso(alpha=0.005, random_state=0))
]
)