The translation of the article was prepared especially for students of the course "Industrial ML on Big Data"
, , . N , , , , - , .
, , , Sklearn, , , , . , AutoVIML Python.
AutoVIML – Python, . , . AutoVIML, , , , – , , .. .
, AutoVIML, , . , , AutoVIML, .
AutoVIML
python-, autoviml
pip
.
pip install autoviml
AutoVIML
from autoviml.Auto_ViML import Auto_ViML
AutoVIML . , Kaggle. .
import pandas as pd
df = pd.read_csv('heart_d.csv')
df
, autoviml
, AutoVIML.
#Basic Example with all parameters
model, features, trainm, testm = Auto_ViML(
train,
target,
test,
sample_submission,
hyper_param="GS",
feature_reduction=True,
scoring_parameter="weighted-f1",
KMeans_Featurizer=False,
Boosting_Flag=False,
Binning_Flag=False,
Add_Poly=False,
Stacking_Flag=False,
Imbalanced_Flag=False,
verbose=0,
)
, AutoVIML, . , .
train
: , dataframe, dataframe. dataframe «df», «df».target
: . «TenYearCHD».test
: . ( ””), , AutoVIML .sample_submission
: , .hyper_param
: RandomizedSearchCV, , Grid Search CV. «RS».feature_reduction
: true, .scoring_parameter
: , . «Weighted-f1».KMeans_featurizer
: true false XGboost , .boosting_flag
: . false.binning_flag
: false, true, .add_poly
: false.stacking_flag
: false. true, , . false.Imbalanced_flag
: true, SMOTING.Verbose
: . 3.
AutoVIML.
model, features, trainm, testm = Auto_ViML(
train=df,
target="TenYearCHD",
test="",
sample_submission="",
hyper_param="RS",
feature_reduction=True,
scoring_parameter="weighted-f1",
KMeans_Featurizer=False,
Boosting_Flag=True,
Binning_Flag=False,
Add_Poly=False,
Stacking_Flag=True,
Imbalanced_Flag=True,
verbose=3
)
.
1.
2.
3.
4.
5.
6.
, AutoVIML , , .
, AutoVIML, , . AutoVIML – , .