diff --git a/examples/PyCaret 2 Anomaly Detection.ipynb b/examples/PyCaret 2 Anomaly Detection.ipynb index 8797391f88e0086e73ce577b0e95e9f776aeab21..903567c24d2a355eae1ece2817a24001d82c68f6 100644 --- a/examples/PyCaret 2 Anomaly Detection.ipynb +++ b/examples/PyCaret 2 Anomaly Detection.ipynb @@ -16180,9785 +16180,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "# 10. Get System Logs" - ] - }, - { - "cell_type": "code", - "execution_count": 20, - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '40', '51,509', 'INFO', 'PyCaret Classification Module']\n", - "['2020-07-31 01', '40', '51,509', 'INFO', 'version 2.0']\n", - "['2020-07-31 01', '40', '51,509', 'INFO', 'Initializing setup()']\n", - "['2020-07-31 01', '40', '51,509', 'INFO', 'USI', '1cda']\n", - "['2020-07-31 01', '40', '51,510', 'INFO', 'setup(data=(1070, 19), target=Purchase, train_size=0.7, sampling=True, sample_estimator=None, categorical_features=None, categorical_imputation=constant, ordinal_features=None,']\n", - "['high_cardinality_features=None, high_cardinality_method=frequency, numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=None, normalize=False,']\n", - "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", - "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None, remove_outliers=False, outliers_threshold=0.05,']\n", - "['remove_multicollinearity=False, multicollinearity_threshold=0.9, remove_perfect_collinearity=False, create_clusters=False, cluster_iter=20,']\n", - "['polynomial_features=False, polynomial_degree=2, trigonometry_features=False, polynomial_threshold=0.1, group_features=None,']\n", - "['group_names=None, feature_selection=False, feature_selection_threshold=0.8, feature_interaction=False, feature_ratio=False, interaction_threshold=0.01,']\n", - "['fix_imbalance=False, fix_imbalance_method=None, data_split_shuffle=True, folds_shuffle=False, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", - "['experiment_name=juice1, log_plots=False, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", - "['2020-07-31 01', '40', '51,526', 'INFO', 'Checking environment']\n", - "['2020-07-31 01', '40', '51,526', 'INFO', 'python_version', '3.7.4']\n", - "['2020-07-31 01', '40', '51,527', 'INFO', 'python_build', \"('default', 'Aug 9 2019 18\", '34', \"13')\"]\n", - "['2020-07-31 01', '40', '51,527', 'INFO', 'machine', 'AMD64']\n", - "['2020-07-31 01', '40', '51,527', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Memory', 'svmem(total=17032478720, available=12121403392, percent=28.8, used=4911075328, free=12121403392)']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Physical Core', '4']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Logical Core', '8']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Checking libraries']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'pd==1.0.5']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'numpy==1.18.5']\n", - "['2020-07-31 01', '40', '55,335', 'INFO', 'sklearn==0.23.1']\n", - "['2020-07-31 01', '40', '55,728', 'INFO', 'xgboost==0.90']\n", - "['2020-07-31 01', '40', '56,084', 'INFO', 'lightgbm==2.3.1']\n", - "['2020-07-31 01', '40', '56,736', 'INFO', 'catboost==0.20.2']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'mlflow==1.8.0']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'Checking Exceptions']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '41', '00,697', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '41', '10,136', 'INFO', 'Copying data for preprocessing']\n", - "['2020-07-31 01', '41', '10,136', 'INFO', 'Declaring global variables']\n", - "['2020-07-31 01', '41', '10,162', 'INFO', 'Declaring preprocessing parameters']\n", - "['2020-07-31 01', '41', '10,162', 'INFO', 'Importing preprocessing module']\n", - "['2020-07-31 01', '41', '14,303', 'INFO', 'Creating preprocessing pipeline']\n", - "['2020-07-31 01', '41', '16,174', 'INFO', 'Preprocessing pipeline created successfully']\n", - "['2020-07-31 01', '41', '16,174', 'INFO', 'Creating grid variables']\n", - "['2020-07-31 01', '41', '16,174', 'INFO', 'Creating global containers']\n", - "['2020-07-31 01', '41', '16,270', 'INFO', 'Logging experiment in MLFlow']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False)]']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'create_model_container 0']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'master_model_container 0']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'display_container 0']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False)']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'setup() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '23,818', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 01', '41', '23,818', 'INFO', 'compare_models(blacklist=None, whitelist=None, fold=10, round=4, sort=Accuracy, n_select=1, turbo=True, verbose=True)']\n", - "['2020-07-31 01', '41', '23,818', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '41', '23,820', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '41', '23,820', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '41', '23,838', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '41', '23,839', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '41', '23,910', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 01', '41', '23,922', 'INFO', 'Import successful']\n", - "['2020-07-31 01', '41', '23,928', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '41', '23,928', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '41', '23,928', 'INFO', 'Initializing Logistic Regression']\n", - "['2020-07-31 01', '41', '23,934', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '23,940', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '23,996', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,003', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,007', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '24,013', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,057', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,064', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,068', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '24,073', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,111', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,118', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,122', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '24,127', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,168', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,174', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,178', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '24,182', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,224', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,230', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,235', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '24,240', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,279', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,286', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,290', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '24,296', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,338', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,345', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,349', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '24,354', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,391', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,398', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,402', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '24,407', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,447', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,453', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,457', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '24,462', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,503', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,514', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '24,514', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '24,523', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'save_model(model=LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '24,644', 'INFO', 'Initializing K Neighbors Classifier']\n", - "['2020-07-31 01', '41', '24,647', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '24,647', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,685', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,905', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,911', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '24,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,922', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,165', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,173', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '25,180', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,185', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,410', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,415', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '25,422', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,427', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,652', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,652', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '25,672', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,676', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,941', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,956', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '25,956', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,972', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,219', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '26,235', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '26,235', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '26,249', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,490', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '26,490', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '26,510', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '26,514', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,744', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '26,750', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '26,756', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '26,760', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,998', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,007', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '27,013', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,019', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,243', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,248', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '27,249', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '27,259', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '27,319', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '27,319', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '27,320', 'INFO', \"save_model(model=KNeighborsClassifier(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '41', '27,320', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '27,330', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '27,338', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), KNeighborsClassifier(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform')]\"]\n", - "['2020-07-31 01', '41', '27,338', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '27,338', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '27,380', 'INFO', 'Initializing Naive Bayes']\n", - "['2020-07-31 01', '41', '27,380', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '27,396', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,398', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,405', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,410', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '27,415', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,418', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,424', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,429', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '27,434', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,437', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,444', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,449', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '27,455', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,458', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,465', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,469', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '27,475', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,478', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,484', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,489', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '27,494', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,497', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,504', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,509', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '27,514', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,517', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,525', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,530', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '27,535', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,538', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,545', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,550', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '27,556', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,559', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,566', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,570', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '27,576', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,579', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,585', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,590', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '27,590', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '27,600', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'save_model(model=GaussianNB(priors=None, var_smoothing=1e-09), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), GaussianNB(priors=None, var_smoothing=1e-09)]']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '27,707', 'INFO', 'Initializing Decision Tree Classifier']\n", - "['2020-07-31 01', '41', '27,712', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '27,718', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,766', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,773', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,778', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '27,783', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,788', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,794', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,799', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '27,806', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,811', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,817', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,825', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '27,834', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,847', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,853', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '27,860', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,866', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,873', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,879', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '27,886', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,891', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,899', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,904', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '27,912', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,917', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,926', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,931', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '27,938', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,944', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,951', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,957', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '27,962', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,967', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,976', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,982', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '27,987', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,993', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,000', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,006', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '28,006', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '28,017', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '28,076', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '28,076', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '28,077', 'INFO', \"save_model(model=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '41', '28,077', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '28,082', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '28,086', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')]\"]\n", - "['2020-07-31 01', '41', '28,087', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '28,087', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '28,135', 'INFO', 'Initializing SVM - Linear Kernel']\n", - "['2020-07-31 01', '41', '28,141', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '28,147', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,188', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,188', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,191', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,193', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,198', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '28,204', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,212', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,212', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,215', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,217', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,222', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '28,227', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,235', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,235', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,238', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,240', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,245', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '28,250', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,256', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,256', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,259', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,262', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,266', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '28,272', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,276', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,276', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,279', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,281', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,286', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '28,291', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,297', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,297', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,300', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,302', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,307', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '28,312', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,319', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,319', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,322', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,324', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,329', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '28,334', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,341', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,341', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,344', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,346', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,350', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '28,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,364', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,364', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,367', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,369', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,374', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '28,378', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,386', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,386', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,389', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,391', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,396', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '28,396', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '28,407', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '28,473', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '28,474', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '28,474', 'INFO', 'save_model(model=SGDClassifier(alpha=0.0001, average=False, class_weight=None,']\n", - "['early_stopping=False, epsilon=0.1, eta0=0.0, fit_intercept=True,']\n", - "[\"l1_ratio=0.15, learning_rate='optimal', loss='hinge',\"]\n", - "[\"max_iter=1000, n_iter_no_change=5, n_jobs=-1, penalty='l2',\"]\n", - "['power_t=0.5, random_state=123, shuffle=True, tol=0.001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '28,474', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '28,479', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '28,483', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), SGDClassifier(alpha=0.0001, average=False, class_weight=None,']\n", - "['early_stopping=False, epsilon=0.1, eta0=0.0, fit_intercept=True,']\n", - "[\"l1_ratio=0.15, learning_rate='optimal', loss='hinge',\"]\n", - "[\"max_iter=1000, n_iter_no_change=5, n_jobs=-1, penalty='l2',\"]\n", - "['power_t=0.5, random_state=123, shuffle=True, tol=0.001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False)]']\n", - "['2020-07-31 01', '41', '28,483', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '28,483', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '28,532', 'INFO', 'Initializing Ridge Classifier']\n", - "['2020-07-31 01', '41', '28,532', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '28,547', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,630', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,630', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,646', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,646', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,646', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '28,646', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,662', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,662', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,665', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,667', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,676', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '28,683', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,687', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,687', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,690', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,692', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,697', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '28,706', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,711', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,711', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,713', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,715', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,720', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '28,726', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,730', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,730', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,733', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,735', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,739', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '28,744', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,748', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,749', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,751', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,754', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,759', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '28,764', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,768', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,768', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,771', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,773', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,778', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '28,784', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,788', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,788', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,791', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,793', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,799', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '28,804', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,809', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,809', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,813', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,816', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,821', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '28,827', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,831', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,831', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,834', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,836', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,841', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '28,841', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '28,853', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '28,934', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '28,935', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '28,935', 'INFO', 'save_model(model=RidgeClassifier(alpha=1.0, class_weight=None, copy_X=True, fit_intercept=True,']\n", - "[\"max_iter=None, normalize=False, random_state=123, solver='auto',\"]\n", - "['tol=0.001), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '28,935', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '28,940', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '28,944', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RidgeClassifier(alpha=1.0, class_weight=None, copy_X=True, fit_intercept=True,']\n", - "[\"max_iter=None, normalize=False, random_state=123, solver='auto',\"]\n", - "['tol=0.001)]']\n", - "['2020-07-31 01', '41', '28,944', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '28,944', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '28,994', 'INFO', 'Initializing Random Forest Classifier']\n", - "['2020-07-31 01', '41', '29,000', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '29,006', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '29,127', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '29,363', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '29,378', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '29,378', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '29,496', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '29,712', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '29,716', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '29,723', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '29,834', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '30,077', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '30,087', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '30,095', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '30,207', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '30,439', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '30,448', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '30,455', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '30,569', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '30,799', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '30,799', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '30,814', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '30,933', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '31,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '31,175', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '31,183', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '31,295', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '31,538', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '31,547', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '31,553', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '31,666', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '31,902', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '31,913', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '31,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,034', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,263', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,263', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '32,263', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,387', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,626', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,630', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '32,630', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '32,642', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '32,729', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '32,729', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '32,729', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '32,760', 'INFO', 'Initializing Quadratic Discriminant Analysis']\n", - "['2020-07-31 01', '41', '32,776', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '32,776', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,838', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,838', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,854', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '32,854', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,854', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,870', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,870', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '32,870', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,885', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,885', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,885', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '32,901', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,901', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,901', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,916', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '32,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,916', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,932', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,932', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '32,932', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,948', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,948', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,948', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '32,963', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,963', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,963', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,979', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '32,979', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,979', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,995', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,995', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '33,010', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,010', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,023', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,029', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '33,033', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,039', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,045', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,050', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '33,050', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '33,062', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'save_model(model=QuadraticDiscriminantAnalysis(priors=None, reg_param=0.0,']\n", - "['store_covariance=False, tol=0.0001), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), QuadraticDiscriminantAnalysis(priors=None, reg_param=0.0,']\n", - "['store_covariance=False, tol=0.0001)]']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '33,161', 'INFO', 'Initializing Ada Boost Classifier']\n", - "['2020-07-31 01', '41', '33,161', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '33,177', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,239', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,255', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,255', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '33,270', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,333', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,348', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,348', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '33,364', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,427', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,442', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,442', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '33,458', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,520', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,536', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,552', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '33,552', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,614', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,649', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,655', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '33,660', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,730', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,746', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,761', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '33,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,839', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,855', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,855', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '33,871', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,933', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,949', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,964', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '33,964', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,027', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,058', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,058', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '34,058', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,136', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,152', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,152', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '34,152', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '34,171', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '34,240', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '34,241', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '34,241', 'INFO', \"save_model(model=AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '34,241', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123)]']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '34,314', 'INFO', 'Initializing Gradient Boosting Classifier']\n", - "['2020-07-31 01', '41', '34,322', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '34,328', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,447', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,455', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,460', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '34,466', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,582', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,589', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,594', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '34,600', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,726', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,733', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,739', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '34,745', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,851', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,868', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,872', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '34,877', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,995', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,002', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,008', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '35,013', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,134', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,142', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,146', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '35,151', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,277', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,284', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,290', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '35,296', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,398', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,398', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,413', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '35,413', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,532', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,539', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,545', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '35,550', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,674', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,680', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,686', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '35,686', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '35,699', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', \"save_model(model=GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '35,814', 'INFO', 'Initializing Linear Discriminant Analysis']\n", - "['2020-07-31 01', '41', '35,832', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '35,838', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,848', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,855', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,860', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '35,865', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,873', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,880', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,885', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '35,890', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,900', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,906', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,911', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '35,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,924', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,931', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,936', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '35,941', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,949', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,956', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,960', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '35,966', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,973', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,980', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,985', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '35,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,999', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,005', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,013', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '36,021', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,031', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,037', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,043', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '36,048', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,055', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,062', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,066', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '36,071', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,079', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,086', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,091', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '36,091', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '36,103', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '36,160', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '36,160', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '36,161', 'INFO', 'save_model(model=LinearDiscriminantAnalysis(n_components=None, priors=None, shrinkage=None,']\n", - "[\"solver='svd', store_covariance=False, tol=0.0001), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '41', '36,161', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '36,165', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '36,168', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LinearDiscriminantAnalysis(n_components=None, priors=None, shrinkage=None,']\n", - "[\"solver='svd', store_covariance=False, tol=0.0001)]\"]\n", - "['2020-07-31 01', '41', '36,168', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '36,168', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '36,199', 'INFO', 'Initializing Extra Trees Classifier']\n", - "['2020-07-31 01', '41', '36,215', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '36,221', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,359', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,592', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,602', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '36,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,759', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,976', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,983', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '36,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '37,131', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '37,369', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '37,369', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '37,390', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '37,529', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '37,769', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '37,769', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '37,792', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '37,934', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '38,165', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '38,181', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '38,181', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '38,333', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '38,572', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '38,572', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '38,588', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '38,732', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '38,984', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '38,994', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '39,003', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '39,164', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '39,413', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '39,419', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '39,419', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '39,586', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '39,808', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '39,808', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '39,823', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '39,966', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,196', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,196', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '40,196', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '40,211', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'save_model(model=ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '40,333', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '40,349', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '40,349', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '40,349', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '40,395', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 01', '41', '40,395', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '40,410', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,501', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,517', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,532', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '40,537', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,568', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,584', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,603', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '40,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,655', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,667', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,678', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '40,687', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,727', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,740', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,751', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '40,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,800', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,813', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,820', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '40,834', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,873', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,886', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,897', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '40,906', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,946', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,959', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,970', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '40,980', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,020', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,032', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,043', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '41,054', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,096', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,109', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,119', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '41,128', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,175', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,188', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,199', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '41,199', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '41,228', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '41,348', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '41,349', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '41,349', 'INFO', \"save_model(model=XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '41,349', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '41,358', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '41,362', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)]']\n", - "['2020-07-31 01', '41', '41,362', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '41,362', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '41,423', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 01', '41', '41,429', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '41,434', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,515', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,533', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,544', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '41,554', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,628', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,645', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,656', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '41,665', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,734', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,737', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,753', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '41,769', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,837', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,838', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,853', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '41,873', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,936', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,937', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,953', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '41,972', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,047', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,063', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,074', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '42,084', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,180', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '42,196', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,208', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '42,218', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,287', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,302', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,318', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '42,318', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,380', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,412', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,412', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '42,427', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,502', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,519', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,530', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '42,531', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '42,561', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '42,651', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '42,651', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '42,652', 'INFO', \"save_model(model=LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '42,652', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '42,663', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '42,675', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)]']\n", - "['2020-07-31 01', '41', '42,675', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '42,675', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '42,777', 'INFO', 'Initializing CatBoost Classifier']\n", - "['2020-07-31 01', '41', '42,783', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '42,789', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '45,155', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '45,194', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '45,199', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '45,205', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '47,070', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '47,086', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '47,086', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '47,086', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '48,735', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '48,751', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '48,751', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '48,764', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '50,511', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '50,526', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '50,542', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '50,542', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '52,170', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '52,170', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '52,186', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '52,193', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '53,805', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '53,820', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '53,820', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '53,834', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '55,391', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '55,391', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '55,407', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '55,407', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '56,979', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '56,994', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '56,994', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '57,008', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '58,639', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '58,654', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '58,670', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '58,670', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,228', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,244', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,244', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '00,244', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '00,260', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '00,317', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '00,317', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '00,318', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '00,318', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '00,325', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '00,329', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ]']\n", - "['2020-07-31 01', '42', '00,329', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '00,329', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '00,375', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 01', '42', '00,375', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'create_model(estimator=lr, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '00,392', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '00,392', 'INFO', 'Logistic Regression Imported succesfully']\n", - "['2020-07-31 01', '42', '00,392', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '00,395', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '00,396', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,435', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,441', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,445', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '00,445', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,476', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,476', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,492', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '00,492', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,523', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,539', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,539', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '00,539', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,585', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,585', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,601', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '00,601', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,632', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,648', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,648', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '00,648', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,679', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,695', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,695', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '00,695', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,882', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,882', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,898', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '00,898', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '00,898', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'display_container', '1']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 01', '42', '00,999', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 01', '42', '00,999', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 01', '42', '01,000', 'INFO', 'display_container', '2']\n", - "['2020-07-31 01', '42', '01,000', 'INFO', 'LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '01,000', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'create_model(estimator=lr, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '01,010', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '01,033', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '01,034', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '01,035', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '01,035', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '01,039', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '01,039', 'INFO', 'Logistic Regression Imported succesfully']\n", - "['2020-07-31 01', '42', '01,040', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '01,046', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '01,050', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,094', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,101', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,113', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '01,118', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,160', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,166', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,180', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '01,185', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,230', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,236', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,248', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '01,253', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,295', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,301', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,314', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '01,322', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,368', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,374', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,378', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '01,378', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,432', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,438', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,444', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '01,444', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,497', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,503', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,511', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '01,511', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,561', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,568', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,582', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '01,587', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,626', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,633', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,646', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '01,651', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,694', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,700', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,715', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '01,716', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '01,724', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '01,766', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '01,930', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '01,931', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '01,931', 'INFO', 'save_model(model=LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '01,931', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '01,936', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '01,940', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '01,940', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '01,940', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '01,960', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '01,960', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '01,993', 'INFO', 'create_model_container', '2']\n", - "['2020-07-31 01', '42', '01,993', 'INFO', 'master_model_container', '2']\n", - "['2020-07-31 01', '42', '01,993', 'INFO', 'display_container', '3']\n", - "['2020-07-31 01', '42', '01,994', 'INFO', 'LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '01,994', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '02,000', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '02,000', 'INFO', 'create_model(estimator=dt, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '02,001', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '02,001', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '02,001', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '02,022', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '02,023', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '02,023', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '02,023', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '02,027', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '02,027', 'INFO', 'Decision Tree Classifier Imported succesfully']\n", - "['2020-07-31 01', '42', '02,028', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '02,035', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '02,040', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,046', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,054', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,069', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '02,073', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,078', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,085', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,099', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '02,104', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,108', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,115', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,133', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '02,137', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,143', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,149', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,165', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '02,170', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,174', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,181', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,198', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '02,204', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,208', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,216', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,234', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '02,239', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,244', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,252', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,268', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '02,273', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,279', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,290', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,307', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '02,313', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,318', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,326', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,342', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '02,347', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,352', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,360', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,376', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '02,377', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '02,385', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '02,390', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '02,521', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '02,521', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '02,521', 'INFO', \"save_model(model=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '42', '02,521', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '02,526', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '02,530', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')]\"]\n", - "['2020-07-31 01', '42', '02,530', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '02,530', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '02,545', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '02,545', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '02,583', 'INFO', 'create_model_container', '3']\n", - "['2020-07-31 01', '42', '02,583', 'INFO', 'master_model_container', '3']\n", - "['2020-07-31 01', '42', '02,583', 'INFO', 'display_container', '4']\n", - "['2020-07-31 01', '42', '02,584', 'INFO', \"DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')\"]\n", - "['2020-07-31 01', '42', '02,584', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '02,591', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '02,591', 'INFO', 'create_model(estimator=rf, ensemble=False, method=None, fold=5, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '02,591', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '02,592', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '02,592', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '02,613', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '02,614', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '02,615', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '02,615', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '02,619', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '02,620', 'INFO', 'Random Forest Classifier Imported succesfully']\n", - "['2020-07-31 01', '42', '02,620', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '02,626', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '02,631', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,758', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '03,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '03,028', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '03,034', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '03,159', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '03,378', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '03,408', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '03,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '03,526', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '03,754', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '03,773', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '03,778', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '03,894', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '04,129', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '04,146', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '04,146', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '04,276', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '04,495', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '04,517', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '04,518', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '04,524', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '04,642', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '05,065', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '05,065', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'create_model_container', '4']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'master_model_container', '4']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'display_container', '5']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '05,131', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 01', '42', '05,131', 'INFO', \"compare_models(blacklist=None, whitelist=['rf', 'ada', 'gbc', 'et', 'xgboost', 'lightgbm', 'catboost'], fold=3, round=4, sort=Accuracy, n_select=1, turbo=True, verbose=True)\"]\n", - "['2020-07-31 01', '42', '05,131', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '05,132', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '05,132', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '05,155', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '05,156', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '05,160', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 01', '42', '05,160', 'INFO', 'Import successful']\n", - "['2020-07-31 01', '42', '05,167', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '05,167', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '05,167', 'INFO', 'Initializing Random Forest Classifier']\n", - "['2020-07-31 01', '42', '05,172', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '05,179', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '05,293', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '05,535', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '05,535', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '05,550', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '05,676', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '05,894', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '05,894', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '05,910', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,026', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,258', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,258', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '06,258', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '06,273', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '06,339', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '06,339', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '06,340', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '06,340', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '06,400', 'INFO', 'Initializing Ada Boost Classifier']\n", - "['2020-07-31 01', '42', '06,405', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '06,411', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,478', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,496', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,496', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '06,496', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,575', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,581', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,596', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '06,596', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,670', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,680', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,680', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '06,680', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '06,696', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', \"save_model(model=AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123)]']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '06,825', 'INFO', 'Initializing Gradient Boosting Classifier']\n", - "['2020-07-31 01', '42', '06,825', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '06,841', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,929', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,929', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,944', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '06,944', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,030', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '07,046', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '07,046', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '07,046', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,146', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '07,146', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '07,162', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '07,162', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '07,162', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '07,241', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '07,241', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '07,242', 'INFO', \"save_model(model=GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '07,242', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '07,249', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '07,254', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '07,254', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '07,254', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '07,294', 'INFO', 'Initializing Extra Trees Classifier']\n", - "['2020-07-31 01', '42', '07,294', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '07,313', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,459', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '07,694', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '07,694', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '07,694', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,859', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,109', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,109', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '08,109', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,277', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,495', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,495', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '08,495', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '08,511', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'save_model(model=ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '08,705', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 01', '42', '08,721', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '08,727', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,759', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,773', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,781', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '08,794', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,828', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,842', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,853', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '08,864', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,900', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,913', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,924', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '08,925', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '08,947', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', \"save_model(model=XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)]']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '09,201', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 01', '42', '09,216', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '09,222', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '09,276', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '09,282', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '09,297', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '09,314', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '09,375', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '09,381', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '09,397', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '09,413', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '09,466', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '09,481', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '09,481', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '09,481', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '09,514', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', \"save_model(model=LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '09,613', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '09,628', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)]']\n", - "['2020-07-31 01', '42', '09,628', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '09,628', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '09,722', 'INFO', 'Initializing CatBoost Classifier']\n", - "['2020-07-31 01', '42', '09,733', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '09,738', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '11,485', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '11,485', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '11,501', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '11,508', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '13,655', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '13,671', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '13,671', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '13,686', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '15,832', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '15,844', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '15,851', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '15,851', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '15,867', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '15,935', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '15,936', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '15,936', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '15,936', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '15,944', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '15,950', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ]']\n", - "['2020-07-31 01', '42', '15,950', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '15,950', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '16,009', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 01', '42', '16,009', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'create_model(estimator=xgboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '16,024', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '16,024', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '16,025', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '16,026', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '16,026', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '16,026', 'INFO', 'Extreme Gradient Boosting Imported succesfully']\n", - "['2020-07-31 01', '42', '16,027', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '16,030', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '16,031', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,079', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,084', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,099', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '16,099', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,146', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,177', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '16,177', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,224', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,240', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,256', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '16,271', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,318', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,334', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,349', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '16,349', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,396', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,412', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,427', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '16,427', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,474', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,490', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,505', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '16,521', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,568', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,584', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,599', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '16,599', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,646', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,662', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,677', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '16,693', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,740', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,755', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,771', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '16,771', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,834', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,849', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,865', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '16,865', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '16,880', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'create_model_container', '5']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'master_model_container', '5']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'display_container', '6']\n", - "['2020-07-31 01', '42', '16,943', 'INFO', \"XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 01', '42', '16,943', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '16,943', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'create_model_container', '5']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'master_model_container', '5']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'display_container', '7']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', \"XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '17,048', 'INFO', 'Initializing tune_model()']\n", - "['2020-07-31 01', '42', '17,049', 'INFO', 'tune_model(estimator=LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), fold=10, round=4, n_iter=10, custom_grid=None, optimize=Accuracy, choose_better=False, verbose=True)']\n", - "['2020-07-31 01', '42', '17,049', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '17,051', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '17,051', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '17,077', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '17,078', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '17,078', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '17,079', 'INFO', 'Base model', 'Logistic Regression']\n", - "['2020-07-31 01', '42', '17,080', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '17,080', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '17,088', 'INFO', 'Defining Hyperparameters']\n", - "['2020-07-31 01', '42', '17,088', 'INFO', 'Initializing RandomizedSearchCV']\n", - "['2020-07-31 01', '42', '20,205', 'INFO', 'Random search completed']\n", - "['2020-07-31 01', '42', '20,213', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '20,220', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,253', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,261', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,282', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '20,289', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,320', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,328', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,347', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '20,354', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,386', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,394', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,414', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '20,420', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,451', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,460', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,478', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '20,484', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,516', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,525', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,543', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '20,549', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,579', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,589', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,609', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '20,615', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,651', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,661', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,683', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '20,689', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,723', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,732', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,756', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '20,762', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,796', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,805', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,825', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '20,832', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,863', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,872', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,894', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '20,895', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '20,904', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '20,934', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '20,934', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '20,935', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '21,014', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '21,015', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '21,015', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '21,015', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'create_model_container', '6']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'master_model_container', '6']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'display_container', '8']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'tune_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '21,242', 'INFO', 'Initializing tune_model()']\n", - "['2020-07-31 01', '42', '21,243', 'INFO', 'tune_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), fold=10, round=4, n_iter=10, custom_grid=None, optimize=Accuracy, choose_better=False, verbose=True)']\n", - "['2020-07-31 01', '42', '21,243', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '21,244', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '21,244', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '21,264', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '21,265', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '21,265', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '21,266', 'INFO', 'Base model', 'Random Forest Classifier']\n", - "['2020-07-31 01', '42', '21,266', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '21,266', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '21,272', 'INFO', 'Defining Hyperparameters']\n", - "['2020-07-31 01', '42', '21,272', 'INFO', 'Initializing RandomizedSearchCV']\n", - "['2020-07-31 01', '42', '22,790', 'INFO', 'Random search completed']\n", - "['2020-07-31 01', '42', '22,816', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '22,831', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '22,955', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '23,185', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '23,211', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '23,217', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '23,340', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '23,563', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '23,582', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '23,586', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '23,716', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '23,951', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '23,968', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '23,974', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '24,091', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '24,320', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '24,351', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '24,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '24,483', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '24,718', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '24,742', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '24,747', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '24,866', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '25,117', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '25,141', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '25,146', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '25,283', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '25,518', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '25,542', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '25,547', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '25,666', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '25,919', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '25,938', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '25,938', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '26,084', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '26,312', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '26,334', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '26,338', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '26,457', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '26,677', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '26,699', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '26,700', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '26,707', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '26,829', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '26,830', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '26,830', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '26,911', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '26,911', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '26,912', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '26,912', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '26,927', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '26,931', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '26,931', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '26,931', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '27,309', 'INFO', 'create_model_container', '7']\n", - "['2020-07-31 01', '42', '27,309', 'INFO', 'master_model_container', '7']\n", - "['2020-07-31 01', '42', '27,309', 'INFO', 'display_container', '9']\n", - "['2020-07-31 01', '42', '27,310', 'INFO', 'RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '27,310', 'INFO', 'tune_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '27,315', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 01', '42', '27,316', 'INFO', \"ensemble_model(estimator=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Bagging, fold=10, n_estimators=10, round=4, choose_better=False, optimize=Accuracy, verbose=True)\"]\n", - "['2020-07-31 01', '42', '27,316', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '27,316', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '27,316', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '27,335', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '27,335', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '27,336', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '27,337', 'INFO', 'Base model', 'Decision Tree Classifier']\n", - "['2020-07-31 01', '42', '27,341', 'INFO', 'Importing untrained ensembler']\n", - "['2020-07-31 01', '42', '27,342', 'INFO', 'BaggingClassifier() succesfully imported']\n", - "['2020-07-31 01', '42', '27,347', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '27,347', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '27,349', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '27,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,384', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,416', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,430', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '27,435', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,459', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,487', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,504', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '27,509', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,534', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,567', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,582', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '27,587', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,612', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,644', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,658', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '27,663', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,686', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,718', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,733', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '27,738', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,764', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,799', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,816', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '27,822', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,852', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,892', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,904', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '27,904', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,938', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,970', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,985', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '27,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,015', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,047', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,062', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '28,067', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,121', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,139', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '28,140', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '28,150', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '28,173', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '28,173', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '28,174', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '28,239', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '28,239', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '28,240', 'INFO', 'save_model(model=BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '28,240', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '28,250', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '28,256', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)]']\n", - "['2020-07-31 01', '42', '28,256', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '28,256', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '28,419', 'INFO', 'create_model_container', '8']\n", - "['2020-07-31 01', '42', '28,420', 'INFO', 'master_model_container', '8']\n", - "['2020-07-31 01', '42', '28,420', 'INFO', 'display_container', '10']\n", - "['2020-07-31 01', '42', '28,421', 'INFO', 'BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)']\n", - "['2020-07-31 01', '42', '28,421', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '28,427', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 01', '42', '28,428', 'INFO', \"ensemble_model(estimator=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Boosting, fold=10, n_estimators=10, round=4, choose_better=False, optimize=Accuracy, verbose=True)\"]\n", - "['2020-07-31 01', '42', '28,428', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '28,428', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '28,429', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '28,447', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '28,447', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '28,449', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '28,452', 'INFO', 'Base model', 'Decision Tree Classifier']\n", - "['2020-07-31 01', '42', '28,456', 'INFO', 'Importing untrained ensembler']\n", - "['2020-07-31 01', '42', '28,457', 'INFO', 'AdaBoostClassifier() succesfully imported']\n", - "['2020-07-31 01', '42', '28,463', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '28,463', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '28,464', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '28,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,508', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,517', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,531', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '28,536', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,568', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,577', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,591', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '28,597', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,634', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,644', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,659', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '28,665', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,708', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,718', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,735', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '28,741', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,778', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,789', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,809', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '28,817', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,858', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,868', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,885', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '28,891', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,920', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,933', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,953', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '28,960', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,003', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '29,013', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '29,028', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '29,033', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,071', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '29,082', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '29,099', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '29,103', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,134', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '29,144', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '29,161', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '29,162', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '29,174', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '29,219', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '29,219', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '29,220', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '29,282', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '29,282', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '29,283', 'INFO', \"save_model(model=AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '29,283', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '29,297', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '29,304', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123)]']\n", - "['2020-07-31 01', '42', '29,304', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '29,304', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '29,449', 'INFO', 'create_model_container', '9']\n", - "['2020-07-31 01', '42', '29,449', 'INFO', 'master_model_container', '9']\n", - "['2020-07-31 01', '42', '29,449', 'INFO', 'display_container', '11']\n", - "['2020-07-31 01', '42', '29,450', 'INFO', \"AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123)']\n", - "['2020-07-31 01', '42', '29,450', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '29,456', 'INFO', 'Initializing blend_models()']\n", - "['2020-07-31 01', '42', '29,459', 'INFO', \"blend_models(estimator_list=[AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)], fold=10, round=4, choose_better=False, optimize=Accuracy, method=soft, turbo=True, verbose=True)']\n", - "['2020-07-31 01', '42', '29,459', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '29,461', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '29,461', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '29,481', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '29,481', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '29,482', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '29,482', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '29,486', 'INFO', 'Defining model names in estimator_list']\n", - "['2020-07-31 01', '42', '29,656', 'INFO', 'n_jobs multiple passed']\n", - "['2020-07-31 01', '42', '29,664', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '29,672', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,826', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '30,112', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '30,136', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '30,147', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '30,300', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '30,559', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '30,571', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '30,576', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '30,719', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '30,986', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '31,001', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '31,007', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '31,147', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '31,442', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '31,460', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '31,466', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '31,602', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '31,896', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '31,921', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '31,927', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '32,074', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '32,325', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '32,340', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '32,346', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '32,497', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '32,810', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '32,826', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '32,836', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '32,985', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '33,258', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '33,272', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '33,281', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '33,422', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '33,716', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '33,731', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '33,736', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '33,878', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '34,182', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '34,205', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '34,206', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '34,219', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '34,367', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '34,368', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '34,368', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '34,421', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '34,422', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '34,429', 'INFO', \"save_model(model=VotingClassifier(estimators=[('Bagging Classifier_1',\"]\n", - "['BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['r...']\n", - "['max_depth=30,']\n", - "[\"max_features='auto',\"]\n", - "['max_leaf_nodes=None,']\n", - "['max_samples=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False,']\n", - "['random_state=123,']\n", - "['verbose=0,']\n", - "['warm_start=False))],']\n", - "['flatten_transform=True, n_jobs=-1, verbose=False,']\n", - "[\"voting='soft', weights=None), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '42', '34,429', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '34,478', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '34,488', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), VotingClassifier(estimators=[('Bagging Classifier_1',\"]\n", - "['BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['r...']\n", - "['max_depth=30,']\n", - "[\"max_features='auto',\"]\n", - "['max_leaf_nodes=None,']\n", - "['max_samples=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False,']\n", - "['random_state=123,']\n", - "['verbose=0,']\n", - "['warm_start=False))],']\n", - "['flatten_transform=True, n_jobs=-1, verbose=False,']\n", - "[\"voting='soft', weights=None)]\"]\n", - "['2020-07-31 01', '42', '34,489', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '34,489', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '34,946', 'INFO', 'create_model_container', '10']\n", - "['2020-07-31 01', '42', '34,947', 'INFO', 'master_model_container', '10']\n", - "['2020-07-31 01', '42', '34,947', 'INFO', 'display_container', '12']\n", - "['2020-07-31 01', '42', '34,953', 'INFO', \"VotingClassifier(estimators=[('Bagging Classifier_1',\"]\n", - "['BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['r...']\n", - "['max_depth=30,']\n", - "[\"max_features='auto',\"]\n", - "['max_leaf_nodes=None,']\n", - "['max_samples=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False,']\n", - "['random_state=123,']\n", - "['verbose=0,']\n", - "['warm_start=False))],']\n", - "['flatten_transform=True, n_jobs=-1, verbose=False,']\n", - "[\"voting='soft', weights=None)\"]\n", - "['2020-07-31 01', '42', '34,954', 'INFO', 'blend_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '34,961', 'INFO', 'Initializing stack_models()']\n", - "['2020-07-31 01', '42', '34,963', 'INFO', \"stack_models(estimator_list=[AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)], meta_model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), fold=10, round=4, method=soft, restack=True, plot=False, choose_better=False, optimize=Accuracy, finalize=False, verbose=True)']\n", - "['2020-07-31 01', '42', '34,964', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '34,965', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '34,965', 'INFO', 'Copying estimator list']\n", - "['2020-07-31 01', '42', '34,970', 'INFO', 'Defining meta model']\n", - "['2020-07-31 01', '42', '34,972', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '34,990', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '34,991', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '34,993', 'INFO', 'Getting model names']\n", - "['2020-07-31 01', '42', '34,995', 'INFO', 'Checking base model', 'AdaBoostClassifier']\n", - "['2020-07-31 01', '42', '34,999', 'INFO', 'Fitting base model']\n", - "['2020-07-31 01', '42', '35,039', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 01', '42', '35,373', 'INFO', 'Checking base model', 'BaggingClassifier']\n", - "['2020-07-31 01', '42', '35,378', 'INFO', 'Fitting base model']\n", - "['2020-07-31 01', '42', '35,408', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 01', '42', '35,751', 'INFO', 'Checking base model', 'RandomForestClassifier']\n", - "['2020-07-31 01', '42', '35,751', 'INFO', 'Fitting base model']\n", - "['2020-07-31 01', '42', '35,872', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 01', '42', '37,647', 'INFO', 'Base layer complete']\n", - "['2020-07-31 01', '42', '37,802', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '37,804', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '37,809', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '37,921', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '38,152', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '38,166', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '38,172', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '38,289', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '38,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '38,540', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '38,554', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '38,673', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '38,892', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '38,922', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '38,929', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '39,040', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '39,259', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '39,274', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '39,286', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '39,406', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '39,641', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '39,660', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '39,660', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '39,792', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '40,042', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '40,064', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '40,070', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '40,189', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '40,439', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '40,454', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '40,461', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '40,574', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '40,793', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '40,808', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '40,816', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '40,938', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '41,188', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '41,209', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '41,215', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '41,339', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '41,557', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '41,572', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '41,572', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '41,583', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '41,583', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '41,583', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '41,658', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '41,658', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '41,658', 'INFO', \"save_model(model=[AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "[\"warm_start=False), 'soft', True], model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '42', '41,658', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '41,674', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '41,690', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), [AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "[\"warm_start=False), 'soft', True]]\"]\n", - "['2020-07-31 01', '42', '41,690', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '41,690', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '42,222', 'INFO', 'create_model_container', '11']\n", - "['2020-07-31 01', '42', '42,222', 'INFO', 'master_model_container', '11']\n", - "['2020-07-31 01', '42', '42,222', 'INFO', 'display_container', '13']\n", - "['2020-07-31 01', '42', '42,224', 'INFO', \"[AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "[\"warm_start=False), 'soft', True]\"]\n", - "['2020-07-31 01', '42', '42,224', 'INFO', 'stack_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '42,230', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '42,231', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=auc, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '42,231', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'plot type', 'auc']\n", - "['2020-07-31 01', '42', '42,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '42,413', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '42', '42,806', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '42,806', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '42,819', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '42,820', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=confusion_matrix, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '42,820', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '42,926', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '42,926', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '42,941', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '42,941', 'INFO', 'plot type', 'confusion_matrix']\n", - "['2020-07-31 01', '42', '42,957', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '42,957', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '42', '43,239', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '43,239', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '43,245', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '43,246', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=boundary, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '43,246', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'plot type', 'boundary']\n", - "['2020-07-31 01', '42', '43,491', 'INFO', 'Fitting StandardScaler()']\n", - "['2020-07-31 01', '42', '43,497', 'INFO', 'Fitting PCA()']\n", - "['2020-07-31 01', '42', '43,525', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '44,935', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '44,935', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '44,969', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '44,970', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=parameter, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '44,970', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'plot type', 'parameter']\n", - "['2020-07-31 01', '42', '45,092', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '45,092', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'create_model(estimator=catboost, ensemble=False, method=None, fold=10, round=4, cross_validation=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '45,120', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '45,121', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '45,122', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '45,122', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '45,127', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '45,128', 'INFO', 'CatBoost Classifier Imported succesfully']\n", - "['2020-07-31 01', '42', '45,128', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '45,133', 'INFO', 'Cross validation set to False']\n", - "['2020-07-31 01', '42', '45,134', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'create_model_container 11']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'master_model_container 11']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'display_container 13']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', '']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'create_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '46,719', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 01', '42', '46,719', 'INFO', 'interpret_model(estimator=, plot=summary, feature=None, observation=None)']\n", - "['2020-07-31 01', '42', '46,719', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'plot type', 'summary']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'model type detected', 'type 2']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 01', '42', '47,714', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 01', '42', '48,401', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '48,401', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'interpret_model(estimator=, plot=correlation, feature=None, observation=None)']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'plot type', 'correlation']\n", - "['2020-07-31 01', '42', '48,424', 'WARNING', 'No feature passed. Default value of feature used for correlation plot', 'WeekofPurchase']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'model type detected', 'type 2']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 01', '42', '48,742', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 01', '42', '49,226', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '49,226', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '49,245', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 01', '42', '49,245', 'INFO', 'interpret_model(estimator=, plot=reason, feature=None, observation=12)']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'plot type', 'reason']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'model type detected', 'type 2']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 01', '42', '49,564', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 01', '42', '49,970', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '49,970', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,001', 'INFO', 'Initializing automl()']\n", - "['2020-07-31 01', '42', '50,001', 'INFO', 'automl(optimize=Recall, use_holdout=False)']\n", - "['2020-07-31 01', '42', '50,001', 'INFO', 'Model Selection Basis', 'CV Results on Training set']\n", - "['2020-07-31 01', '42', '50,007', 'INFO', 'SubProcess finalize_model() called ==================================']\n", - "['2020-07-31 01', '42', '50,008', 'INFO', 'Initializing finalize_model()']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', \"finalize_model(estimator=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False))']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', 'Getting model name']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', 'Finalizing Logistic Regression']\n", - "['2020-07-31 01', '42', '50,038', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '50,073', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 01', '42', '50,073', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', \"create_model(estimator=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '50,082', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '50,082', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Declaring custom model']\n", - "['2020-07-31 01', '42', '50,084', 'INFO', 'Logistic Regression Imported succesfully']\n", - "['2020-07-31 01', '42', '50,085', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '50,087', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '50,088', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,114', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,121', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,126', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '50,128', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,152', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,158', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,162', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '50,163', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,181', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,181', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,181', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '50,196', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,212', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,212', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,228', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '50,228', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,243', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,259', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,259', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '50,259', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,275', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,290', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,290', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '50,290', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,306', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,321', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,321', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '50,321', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,389', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,402', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,407', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '50,409', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,430', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'create_model_container', '12']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'master_model_container', '12']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'display_container', '14']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'create_model_container', '12']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'master_model_container', '12']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'display_container', '14']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'finalize_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'SubProcess finalize_model() end ==================================']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'automl() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '01,294', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '45', '01,295', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=best-model, verbose=True)']\n", - "['2020-07-31 01', '45', '01,295', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '45', '01,303', 'INFO', 'best-model.pkl saved in current working directory']\n", - "['2020-07-31 01', '45', '01,308', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '45', '01,309', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '03,776', 'INFO', 'Initializing deploy_model()']\n", - "['2020-07-31 01', '45', '03,776', 'INFO', \"deploy_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "[\"warm_start=False), model_name=best-aws, authentication={'bucket'\", \"'pycaret-test'}, platform=aws)\"]\n", - "['2020-07-31 01', '45', '03,798', 'INFO', 'Platform', 'AWS S3']\n", - "['2020-07-31 01', '45', '03,997', 'INFO', 'Saving model in active working directory']\n", - "['2020-07-31 01', '45', '03,997', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '45', '03,997', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '45', '03,998', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=best-aws, verbose=False)']\n", - "['2020-07-31 01', '45', '03,998', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '45', '04,004', 'INFO', 'best-aws.pkl saved in current working directory']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', 'Initializing S3 client']\n", - "['2020-07-31 01', '45', '04,989', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '45', '04,989', 'INFO', 'deploy_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'get_config(variable=X_train)']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'Global variable', 'X_train returned']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,044', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 01', '45', '05,044', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 01', '45', '05,045', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 01', '45', '05,045', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'Initializing set_config()']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'set_config(variable=seed, value=999)']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'Global variable', 'seed updated']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'set_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '23,821', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '45', '23,822', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=FEATURE, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '45', '23,822', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '45', '27,575', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '45', '27,577', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=feature, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '45', '27,577', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '45', '27,691', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '45', '27,691', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '45', '27,691', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '45', '27,691', 'INFO', 'plot type', 'feature']\n", - "['2020-07-31 01', '45', '27,691', 'WARNING', 'No coef_ found. Trying feature_importances_']\n", - "['2020-07-31 01', '45', '27,906', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '45', '27,906', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '31,933', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '45', '31,934', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=pr, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '45', '31,934', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'plot type', 'pr']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '45', '32,057', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '45', '32,376', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '45', '32,376', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '42,906', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '45', '42,907', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=class_report, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '45', '42,907', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '45', '43,013', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '45', '43,013', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '45', '43,013', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '45', '43,013', 'INFO', 'plot type', 'class_report']\n", - "['2020-07-31 01', '45', '43,032', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '45', '43,033', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '45', '43,362', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '45', '43,362', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '16,732', 'INFO', 'PyCaret Regression Module']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'version 2.0']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'Initializing setup()']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'USI', '5b1c']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'setup(data=(1338, 7), target=charges, train_size=0.7, sampling=True, sample_estimator=None, categorical_features=None, categorical_imputation=constant, ordinal_features=None,']\n", - "['high_cardinality_features=None, high_cardinality_method=frequency, numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=None, normalize=False,']\n", - "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", - "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None, remove_outliers=False, outliers_threshold=0.05,']\n", - "['remove_multicollinearity=False, multicollinearity_threshold=0.9, remove_perfect_collinearity=False, create_clusters=False, cluster_iter=20,']\n", - "['polynomial_features=False, polynomial_degree=2, trigonometry_features=False, polynomial_threshold=0.1, group_features=None,']\n", - "['group_names=None, feature_selection=False, feature_selection_threshold=0.8, feature_interaction=False, feature_ratio=False, interaction_threshold=0.01, transform_target=False,']\n", - "['transform_target_method=box-cox, data_split_shuffle=True, folds_shuffle=False, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", - "['experiment_name=insurance1, log_plots=False, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'Checking environment']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'python_version', '3.7.4']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'python_build', \"('default', 'Aug 9 2019 18\", '34', \"13')\"]\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'machine', 'AMD64']\n", - "['2020-07-31 08', '44', '16,734', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'Memory', 'svmem(total=17032478720, available=12508303360, percent=26.6, used=4524175360, free=12508303360)']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'Physical Core', '4']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'Logical Core', '8']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'Checking libraries']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'pd==1.0.5']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'numpy==1.18.5']\n", - "['2020-07-31 08', '44', '17,421', 'INFO', 'sklearn==0.23.1']\n", - "['2020-07-31 08', '44', '17,518', 'INFO', 'xgboost==0.90']\n", - "['2020-07-31 08', '44', '17,654', 'INFO', 'lightgbm==2.3.1']\n", - "['2020-07-31 08', '44', '17,720', 'INFO', 'catboost==0.20.2']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'mlflow==1.8.0']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'Checking Exceptions']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '44', '21,667', 'INFO', 'Copying data for preprocessing']\n", - "['2020-07-31 08', '44', '21,667', 'INFO', 'Declaring global variables']\n", - "['2020-07-31 08', '44', '21,672', 'INFO', 'Declaring preprocessing parameters']\n", - "['2020-07-31 08', '44', '21,672', 'INFO', 'Importing preprocessing module']\n", - "['2020-07-31 08', '44', '22,570', 'INFO', 'Creating preprocessing pipeline']\n", - "['2020-07-31 08', '44', '23,523', 'INFO', 'Preprocessing pipeline created successfully']\n", - "['2020-07-31 08', '44', '23,523', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '23,523', 'INFO', 'Creating grid variables']\n", - "['2020-07-31 08', '44', '23,525', 'INFO', 'Creating global containers']\n", - "['2020-07-31 08', '44', '23,590', 'INFO', 'Logging experiment in MLFlow']\n", - "['2020-07-31 08', '44', '23,723', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '23,724', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '23,728', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", - "['2020-07-31 08', '44', '23,728', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '23,732', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '23,740', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), None]']\n", - "['2020-07-31 08', '44', '23,740', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '23,740', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '23,806', 'INFO', 'create_model_container', '0']\n", - "['2020-07-31 08', '44', '23,806', 'INFO', 'master_model_container', '0']\n", - "['2020-07-31 08', '44', '23,806', 'INFO', 'display_container', '0']\n", - "['2020-07-31 08', '44', '23,806', 'INFO', 'setup() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'compare_models(blacklist=None, whitelist=None, fold=5, round=4, sort=R2, n_select=1, turbo=True, verbose=True)']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '44', '25,754', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '44', '25,756', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '44', '25,767', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 08', '44', '25,768', 'INFO', 'Import successful']\n", - "['2020-07-31 08', '44', '25,774', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '44', '25,774', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '44', '25,774', 'INFO', 'Initializing Linear Regression']\n", - "['2020-07-31 08', '44', '25,782', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '25,788', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,795', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,796', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,797', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,856', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '25,873', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,876', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,877', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,877', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,883', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '25,888', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,892', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,894', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,894', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,900', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '25,905', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,907', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,909', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,909', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,915', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '25,920', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,923', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,925', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,925', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,931', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '25,932', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '25,940', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '25,990', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '25,990', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '25,991', 'INFO', 'save_model(model=LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '25,991', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '25,995', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '25,999', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), None]']\n", - "['2020-07-31 08', '44', '25,999', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '25,999', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,024', 'INFO', 'Initializing Lasso Regression']\n", - "['2020-07-31 08', '44', '26,039', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,051', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,056', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,057', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,058', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,063', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,071', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,074', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,076', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,076', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,082', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,088', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,093', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,093', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,099', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,105', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,108', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,109', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,110', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,115', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '26,121', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,125', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,126', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,126', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,132', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '26,132', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '26,140', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '26,196', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '26,197', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '26,197', 'INFO', 'save_model(model=Lasso(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=1000,']\n", - "['normalize=False, positive=False, precompute=False, random_state=123,']\n", - "[\"selection='cyclic', tol=0.0001, warm_start=False), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '26,197', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '26,201', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '26,205', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Lasso(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=1000,']\n", - "['normalize=False, positive=False, precompute=False, random_state=123,']\n", - "[\"selection='cyclic', tol=0.0001, warm_start=False), None]\"]\n", - "['2020-07-31 08', '44', '26,206', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '26,206', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,250', 'INFO', 'Initializing Ridge Regression']\n", - "['2020-07-31 08', '44', '26,255', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,260', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,265', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,266', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,266', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,272', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,278', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,281', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,283', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,283', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,289', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,294', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,297', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,298', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,298', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,304', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,309', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,312', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,314', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,314', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,320', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '26,325', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,329', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,330', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,330', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,336', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '26,336', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '26,346', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '26,403', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '26,403', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '26,403', 'INFO', 'save_model(model=Ridge(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=None,']\n", - "[\"normalize=False, random_state=123, solver='auto', tol=0.001), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '26,403', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '26,407', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '26,413', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Ridge(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=None,']\n", - "[\"normalize=False, random_state=123, solver='auto', tol=0.001), None]\"]\n", - "['2020-07-31 08', '44', '26,413', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '26,413', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,453', 'INFO', 'Initializing Elastic Net']\n", - "['2020-07-31 08', '44', '26,458', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,463', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,467', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,468', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,468', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,474', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,480', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,483', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,485', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,485', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,490', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,496', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,498', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,500', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,500', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,505', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,511', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,514', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,517', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,517', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,523', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '26,528', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,530', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,532', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,532', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,538', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '26,538', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '26,552', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '26,618', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '26,618', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '26,618', 'INFO', 'save_model(model=ElasticNet(alpha=1.0, copy_X=True, fit_intercept=True, l1_ratio=0.5,']\n", - "['max_iter=1000, normalize=False, positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic', tol=0.0001, warm_start=False), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '26,619', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '26,623', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '26,627', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ElasticNet(alpha=1.0, copy_X=True, fit_intercept=True, l1_ratio=0.5,']\n", - "['max_iter=1000, normalize=False, positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic', tol=0.0001, warm_start=False), None]\"]\n", - "['2020-07-31 08', '44', '26,627', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '26,628', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,667', 'INFO', 'Initializing Least Angle Regression']\n", - "['2020-07-31 08', '44', '26,672', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,678', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,684', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,686', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,686', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,692', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,698', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,703', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,705', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,705', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,710', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,716', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,721', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,723', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,723', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,728', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,735', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,742', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,744', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,744', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,751', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '26,756', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,762', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,764', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,764', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,771', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '26,772', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '26,787', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'save_model(model=Lars(copy_X=True, eps=2.220446049250313e-16, fit_intercept=True, fit_path=True,']\n", - "[\"jitter=None, n_nonzero_coefs=500, normalize=True, precompute='auto',\"]\n", - "['random_state=None, verbose=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '26,857', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Lars(copy_X=True, eps=2.220446049250313e-16, fit_intercept=True, fit_path=True,']\n", - "[\"jitter=None, n_nonzero_coefs=500, normalize=True, precompute='auto',\"]\n", - "['random_state=None, verbose=False), None]']\n", - "['2020-07-31 08', '44', '26,857', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '26,857', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,889', 'INFO', 'Initializing Lasso Least Angle Regression']\n", - "['2020-07-31 08', '44', '26,909', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,918', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,923', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,924', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,924', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,932', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,937', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,943', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,945', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,945', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,954', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,961', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,967', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,968', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,969', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,975', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,982', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,988', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,990', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,990', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,997', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '27,003', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,009', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,012', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,012', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,021', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '27,021', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '27,032', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '27,089', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '27,090', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '27,090', 'INFO', 'save_model(model=LassoLars(alpha=1.0, copy_X=True, eps=2.220446049250313e-16, fit_intercept=True,']\n", - "['fit_path=True, jitter=None, max_iter=500, normalize=True,']\n", - "[\"positive=False, precompute='auto', random_state=None, verbose=False), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '27,090', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '27,095', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '27,100', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LassoLars(alpha=1.0, copy_X=True, eps=2.220446049250313e-16, fit_intercept=True,']\n", - "['fit_path=True, jitter=None, max_iter=500, normalize=True,']\n", - "[\"positive=False, precompute='auto', random_state=None, verbose=False), None]\"]\n", - "['2020-07-31 08', '44', '27,100', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '27,100', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '27,144', 'INFO', 'Initializing Orthogonal Matching Pursuit']\n", - "['2020-07-31 08', '44', '27,148', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '27,155', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,158', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,160', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,160', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,166', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '27,173', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,177', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,178', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,179', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,186', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '27,194', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,197', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,199', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,199', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,206', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '27,213', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,216', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,218', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,218', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,224', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '27,232', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,236', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,237', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,237', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,244', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '27,245', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '27,262', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '27,325', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '27,325', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '27,326', 'INFO', 'save_model(model=OrthogonalMatchingPursuit(fit_intercept=True, n_nonzero_coefs=None,']\n", - "[\"normalize=True, precompute='auto', tol=None), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '27,326', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '27,331', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '27,335', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), OrthogonalMatchingPursuit(fit_intercept=True, n_nonzero_coefs=None,']\n", - "[\"normalize=True, precompute='auto', tol=None), None]\"]\n", - "['2020-07-31 08', '44', '27,335', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '27,335', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '27,376', 'INFO', 'Initializing Bayesian Ridge']\n", - "['2020-07-31 08', '44', '27,381', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '27,387', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,393', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,395', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,396', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,403', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '27,410', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,415', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,417', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,417', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,423', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '27,429', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,434', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,435', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,436', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,441', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '27,447', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,455', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,457', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,457', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,463', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '27,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,474', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,476', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,476', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,482', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '27,482', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '27,493', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '27,550', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '27,551', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '27,551', 'INFO', 'save_model(model=BayesianRidge(alpha_1=1e-06, alpha_2=1e-06, alpha_init=None,']\n", - "['compute_score=False, copy_X=True, fit_intercept=True,']\n", - "['lambda_1=1e-06, lambda_2=1e-06, lambda_init=None, n_iter=300,']\n", - "['normalize=False, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '27,551', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '27,556', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '27,559', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), BayesianRidge(alpha_1=1e-06, alpha_2=1e-06, alpha_init=None,']\n", - "['compute_score=False, copy_X=True, fit_intercept=True,']\n", - "['lambda_1=1e-06, lambda_2=1e-06, lambda_init=None, n_iter=300,']\n", - "['normalize=False, tol=0.001, verbose=False), None]']\n", - "['2020-07-31 08', '44', '27,559', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '27,559', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '27,590', 'INFO', 'Initializing Passive Aggressive Regressor']\n", - "['2020-07-31 08', '44', '27,606', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '27,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,619', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,620', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,620', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,626', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '27,631', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,638', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,640', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,640', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,645', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '27,651', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,656', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,658', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,658', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,664', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '27,669', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,675', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,677', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,677', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,683', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '27,687', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,694', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,696', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,696', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,701', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '27,702', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '27,712', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '27,773', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '27,773', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '27,774', 'INFO', 'save_model(model=PassiveAggressiveRegressor(C=1.0, average=False, early_stopping=False,']\n", - "['epsilon=0.1, fit_intercept=True,']\n", - "[\"loss='epsilon_insensitive', max_iter=1000,\"]\n", - "['n_iter_no_change=5, random_state=123, shuffle=True,']\n", - "['tol=0.001, validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '27,774', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '27,775', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '27,783', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), PassiveAggressiveRegressor(C=1.0, average=False, early_stopping=False,']\n", - "['epsilon=0.1, fit_intercept=True,']\n", - "[\"loss='epsilon_insensitive', max_iter=1000,\"]\n", - "['n_iter_no_change=5, random_state=123, shuffle=True,']\n", - "['tol=0.001, validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), None]']\n", - "['2020-07-31 08', '44', '27,783', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '27,783', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '27,826', 'INFO', 'Initializing Random Sample Consensus']\n", - "['2020-07-31 08', '44', '27,831', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '27,836', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,923', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,924', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,924', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,930', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '27,935', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '28,015', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '28,017', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '28,017', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '28,022', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '28,027', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '28,105', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '28,106', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '28,106', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '28,112', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '28,116', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '28,195', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '28,197', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '28,197', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '28,202', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '28,208', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '28,298', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '28,300', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '28,300', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '28,306', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '28,306', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '28,322', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'save_model(model=RANSACRegressor(base_estimator=None, is_data_valid=None, is_model_valid=None,']\n", - "[\"loss='absolute_loss', max_skips=inf, max_trials=100,\"]\n", - "['min_samples=0.5, random_state=123, residual_threshold=None,']\n", - "['stop_n_inliers=inf, stop_probability=0.99, stop_score=inf), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '28,396', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RANSACRegressor(base_estimator=None, is_data_valid=None, is_model_valid=None,']\n", - "[\"loss='absolute_loss', max_skips=inf, max_trials=100,\"]\n", - "['min_samples=0.5, random_state=123, residual_threshold=None,']\n", - "['stop_n_inliers=inf, stop_probability=0.99, stop_score=inf), None]']\n", - "['2020-07-31 08', '44', '28,396', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '28,396', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '28,441', 'INFO', 'Initializing TheilSen Regressor']\n", - "['2020-07-31 08', '44', '28,446', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '28,450', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '30,326', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '30,328', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '30,328', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '30,334', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '30,339', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '30,808', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '30,808', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '30,808', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '30,824', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '30,830', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '31,292', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '31,292', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '31,292', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '31,307', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '31,313', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '31,820', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '31,822', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '31,822', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '31,827', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '31,827', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,321', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,321', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,321', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,336', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '32,336', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '32,353', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '32,409', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '32,409', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'save_model(model=TheilSenRegressor(copy_X=True, fit_intercept=True, max_iter=300,']\n", - "['max_subpopulation=10000, n_jobs=-1, n_subsamples=None,']\n", - "['random_state=123, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), TheilSenRegressor(copy_X=True, fit_intercept=True, max_iter=300,']\n", - "['max_subpopulation=10000, n_jobs=-1, n_subsamples=None,']\n", - "['random_state=123, tol=0.001, verbose=False), None]']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '32,457', 'INFO', 'Initializing Huber Regressor']\n", - "['2020-07-31 08', '44', '32,457', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '32,468', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,520', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,522', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,522', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,527', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '32,527', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,579', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,580', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,580', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,586', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '32,591', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,636', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,638', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,638', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,643', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '32,650', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,690', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,692', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,692', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,697', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '32,702', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,749', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,750', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,750', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,756', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '32,756', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '32,761', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '32,821', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '32,822', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '32,822', 'INFO', 'save_model(model=HuberRegressor(alpha=0.0001, epsilon=1.35, fit_intercept=True, max_iter=100,']\n", - "['tol=1e-05, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '32,822', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '32,827', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '32,831', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), HuberRegressor(alpha=0.0001, epsilon=1.35, fit_intercept=True, max_iter=100,']\n", - "['tol=1e-05, warm_start=False), None]']\n", - "['2020-07-31 08', '44', '32,831', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '32,831', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '32,860', 'INFO', 'Initializing Support Vector Machine']\n", - "['2020-07-31 08', '44', '32,860', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '32,880', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,938', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,942', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,943', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,948', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '32,953', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,976', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,981', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,981', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,986', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '32,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,013', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,018', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,018', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,024', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '33,029', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,053', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,058', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,058', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,062', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '33,067', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,096', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,096', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,101', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '33,102', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '33,113', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '33,175', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '33,176', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '33,176', 'INFO', \"save_model(model=SVR(C=1.0, cache_size=200, coef0=0.0, degree=3, epsilon=0.1, gamma='scale',\"]\n", - "[\"kernel='rbf', max_iter=-1, shrinking=True, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '33,176', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '33,177', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '33,177', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), SVR(C=1.0, cache_size=200, coef0=0.0, degree=3, epsilon=0.1, gamma='scale',\"]\n", - "[\"kernel='rbf', max_iter=-1, shrinking=True, tol=0.001, verbose=False), None]\"]\n", - "['2020-07-31 08', '44', '33,177', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '33,177', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '33,211', 'INFO', 'Initializing K Neighbors Regressor']\n", - "['2020-07-31 08', '44', '33,227', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '33,227', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,227', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,358', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,358', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,373', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '33,383', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,388', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,507', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,507', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,507', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '33,519', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,523', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,641', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,641', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,657', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '33,669', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,674', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,780', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,780', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,788', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '33,794', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,798', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,908', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,908', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,908', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '33,908', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '33,945', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '34,004', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '34,005', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '34,005', 'INFO', \"save_model(model=KNeighborsRegressor(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '34,005', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '34,010', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '34,011', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), KNeighborsRegressor(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform'), None]\"]\n", - "['2020-07-31 08', '44', '34,011', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '34,011', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '34,042', 'INFO', 'Initializing Decision Tree']\n", - "['2020-07-31 08', '44', '34,060', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '34,065', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,070', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,072', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,072', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,078', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '34,084', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,089', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,090', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,090', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,096', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '34,101', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,105', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,107', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,107', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,113', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '34,118', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,122', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,124', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,124', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,130', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '34,135', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,140', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,141', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,141', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,147', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '34,147', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '34,159', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '34,216', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '34,217', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '34,217', 'INFO', \"save_model(model=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '34,217', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '34,222', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '34,226', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), None]\"]\n", - "['2020-07-31 08', '44', '34,226', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '34,226', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '34,259', 'INFO', 'Initializing Random Forest']\n", - "['2020-07-31 08', '44', '34,259', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '34,276', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,425', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,550', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,550', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,550', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '34,561', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,708', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,813', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,814', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,828', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '34,844', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '35,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '35,197', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '35,197', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '35,203', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '35,208', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '35,456', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '35,575', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '35,575', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '35,582', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '35,590', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '35,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '35,966', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '35,966', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '35,966', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '35,966', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '35,981', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '36,045', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '36,045', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '36,045', 'INFO', \"save_model(model=RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '36,045', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '36,076', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '36,076', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '44', '36,076', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '36,076', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '36,123', 'INFO', 'Initializing Extra Trees Regressor']\n", - "['2020-07-31 08', '44', '36,123', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '36,141', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '36,290', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '36,396', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '36,396', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '36,412', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '36,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '36,574', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '36,684', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '36,684', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '36,684', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '36,699', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '36,842', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '36,962', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '36,962', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '36,977', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '36,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,141', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,267', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,267', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,282', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '37,299', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,441', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,558', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,558', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,558', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '37,558', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '37,573', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '37,661', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '37,661', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '37,661', 'INFO', \"save_model(model=ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '37,661', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '37,693', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '37,693', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '44', '37,693', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '37,693', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '37,739', 'INFO', 'Initializing AdaBoost Regressor']\n", - "['2020-07-31 08', '44', '37,739', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '37,758', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,782', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,785', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,785', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,790', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '37,797', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,817', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,820', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,820', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,827', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '37,833', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,851', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,854', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,854', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,861', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '37,866', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,882', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,884', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,884', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,891', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '37,897', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,916', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,918', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,918', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,925', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '37,925', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '37,939', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '37,998', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '37,998', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '37,999', 'INFO', \"save_model(model=AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '37,999', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '38,008', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '38,013', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", - "['n_estimators=50, random_state=123), None]']\n", - "['2020-07-31 08', '44', '38,013', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '38,013', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '38,045', 'INFO', 'Initializing Gradient Boosting Regressor']\n", - "['2020-07-31 08', '44', '38,045', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '38,066', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,130', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,145', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,145', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,145', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '38,159', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,230', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,230', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,230', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,230', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '38,245', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,318', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,320', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,320', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,326', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '38,332', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,396', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,396', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,396', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,396', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '38,415', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,484', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,486', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,486', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,492', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '38,492', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '38,508', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', \"save_model(model=GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '38,578', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '44', '38,578', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '38,578', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '38,625', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 08', '44', '38,625', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '38,642', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,685', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,686', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,687', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,697', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '38,711', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,753', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,755', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,755', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,773', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '38,783', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,827', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,829', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,829', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,846', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '38,855', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,899', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,901', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,901', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,914', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '38,926', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,968', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,970', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,970', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,982', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '38,983', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '39,014', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', \"save_model(model=XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '39,112', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), None]']\n", - "['2020-07-31 08', '44', '39,112', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '39,112', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '39,143', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 08', '44', '39,159', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '39,165', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,231', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,246', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,246', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,246', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '39,269', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,361', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,365', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,365', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,378', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '39,388', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,482', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,486', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,486', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,499', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '39,510', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,581', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,581', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,581', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,596', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '39,608', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,693', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,697', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,697', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,710', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '39,710', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '39,742', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '39,836', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '39,836', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '39,837', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '39,837', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '39,848', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '39,848', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '44', '39,848', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '39,848', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '39,956', 'INFO', 'Initializing CatBoost Regressor']\n", - "['2020-07-31 08', '44', '39,961', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '39,969', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '41,306', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '41,306', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '41,306', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '41,322', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '41,330', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '42,400', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '42,402', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '42,403', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '42,410', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '42,416', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '43,476', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '43,492', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '43,492', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '43,492', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '43,504', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '44,609', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '44,609', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '44,609', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '44,609', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '44,627', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '45,723', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '45,774', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '45,775', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '45,775', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '45,775', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '45,813', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '45,834', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), , None]']\n", - "['2020-07-31 08', '44', '45,834', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '45,834', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '45,916', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 08', '44', '45,916', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'create_model(estimator=xgboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '44', '45,935', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '44', '45,935', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '44', '45,936', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '44', '45,936', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '44', '45,937', 'INFO', 'Extreme Gradient Boosting Regressor Imported succesfully']\n", - "['2020-07-31 08', '44', '45,937', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '44', '45,938', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '45,939', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '45,977', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '45,979', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '45,979', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '45,990', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '45,992', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,031', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,033', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,033', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,044', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '46,048', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,067', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,083', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,083', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,083', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '46,083', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,129', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,129', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,129', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,129', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '46,145', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,176', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,176', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,176', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,192', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '44', '46,192', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,223', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,223', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,223', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,239', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '44', '46,239', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,270', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,270', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,270', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,286', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '44', '46,286', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,335', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,337', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,337', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,349', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '44', '46,350', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,397', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,397', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,397', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,412', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '44', '46,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,459', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,459', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,459', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,475', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '46,475', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '46,490', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'display_container', '1']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', \"XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'create_model() succesfully completed......................................']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '44', '46,521', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', 'display_container', '2']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', \"XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '06,693', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '06,693', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '06,694', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '06,694', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '06,694', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '06,717', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '06,717', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '06,718', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '06,718', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '06,722', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '06,723', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '06,728', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '06,733', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '06,819', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '06,823', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '06,823', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '06,852', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '06,860', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '06,951', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '06,955', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '06,955', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '06,984', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '06,992', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,090', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,094', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,094', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,123', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '07,132', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,207', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,207', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,207', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,246', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '07,255', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,339', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,343', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,343', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,374', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '07,383', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,466', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,469', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,469', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,499', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '07,507', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,591', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,595', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,595', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,626', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '07,635', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,717', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,721', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,721', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,753', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '07,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,842', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,842', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,842', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,877', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '07,885', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,972', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,975', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,976', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '08,009', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '08,011', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '08,024', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '08,113', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '08,329', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '08,329', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '08,330', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '08,330', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '08,349', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '08,360', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '08,360', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '08,361', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '08,401', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '08,401', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', 'create_model_container', '2']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', 'master_model_container', '2']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', 'display_container', '3']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '09,734', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '09,734', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '09,734', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '09,734', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '09,735', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '09,754', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '09,755', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '09,756', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '09,756', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '09,761', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '09,761', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '09,766', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '09,771', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '09,853', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '09,857', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '09,857', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '09,886', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '09,894', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '09,980', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '09,984', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '09,984', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,013', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '10,023', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,104', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,108', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,108', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,137', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '10,145', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,250', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,253', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,254', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,285', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '10,294', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,393', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,396', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,397', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,426', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '10,435', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,516', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,520', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,520', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,542', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '10,565', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,650', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,654', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,654', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,685', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '10,693', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,777', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,780', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,781', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,812', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '10,821', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,905', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,910', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,910', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,948', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '10,957', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '11,041', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '11,045', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '11,045', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '11,075', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '11,077', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '11,094', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '11,191', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '11,397', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '11,397', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '11,398', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '11,399', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '11,417', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '11,427', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '11,428', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '11,428', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '11,465', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '11,465', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '11,521', 'INFO', 'create_model_container', '3']\n", - "['2020-07-31 08', '45', '11,522', 'INFO', 'master_model_container', '3']\n", - "['2020-07-31 08', '45', '11,522', 'INFO', 'display_container', '4']\n", - "['2020-07-31 08', '45', '11,522', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '11,522', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '11,540', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '11,541', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '11,542', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '11,542', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '11,546', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '11,547', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '11,551', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '11,557', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '11,638', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '11,642', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '11,642', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '11,670', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '11,679', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '11,784', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '11,788', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '11,788', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '11,812', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '11,820', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,003', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,007', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,007', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,037', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '12,046', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,125', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,126', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,126', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,159', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '12,168', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,250', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,254', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,254', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,285', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '12,294', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,383', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,387', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,387', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,417', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '12,426', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,492', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,508', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,508', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,542', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '12,550', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,660', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,663', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,664', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,698', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '12,708', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,794', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,798', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,798', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,830', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '12,838', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,921', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,925', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,925', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,959', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '12,961', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '12,975', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '13,077', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '13,302', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '13,303', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '13,304', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.2, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '13,304', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '13,323', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '13,335', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.2, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '13,335', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '13,335', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '13,373', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '13,373', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '13,434', 'INFO', 'create_model_container', '4']\n", - "['2020-07-31 08', '45', '13,434', 'INFO', 'master_model_container', '4']\n", - "['2020-07-31 08', '45', '13,434', 'INFO', 'display_container', '5']\n", - "['2020-07-31 08', '45', '13,434', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.2, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '13,452', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '13,452', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '13,453', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '13,453', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '13,458', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '13,458', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '13,463', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '13,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '13,542', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '13,542', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '13,542', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '13,579', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '13,588', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '13,659', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '13,659', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '13,659', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '13,700', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '13,708', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '13,776', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '13,776', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '13,776', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '13,820', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '13,828', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '13,910', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '13,910', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '13,910', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '13,943', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '13,951', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,043', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,043', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,043', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,081', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '14,090', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,196', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,200', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,200', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,230', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '14,240', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,334', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,337', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,338', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,370', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '14,379', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,463', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,467', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,467', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,498', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '14,507', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,588', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,592', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,592', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,625', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '14,634', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,732', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,736', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,736', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,767', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '14,769', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '14,783', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '14,871', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '15,089', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '15,090', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '15,091', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.30000000000000004,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '15,091', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '15,110', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '15,122', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.30000000000000004,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '15,122', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '15,122', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '15,159', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '15,159', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', 'create_model_container', '5']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', 'master_model_container', '5']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', 'display_container', '6']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.30000000000000004,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0)']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '15,236', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '15,237', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '15,238', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '15,238', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '15,242', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '15,243', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '15,247', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '15,252', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,327', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,327', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,327', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,364', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '15,373', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,457', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,461', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,461', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,489', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '15,497', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,578', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,578', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,578', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,610', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '15,619', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,726', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,730', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,730', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,759', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '15,769', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,861', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,865', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,865', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,897', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '15,906', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,004', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,008', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,039', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '16,049', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,142', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,146', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,147', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,180', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '16,189', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,280', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,284', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,284', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,315', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '16,325', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,410', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,414', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,414', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,449', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '16,458', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,553', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,557', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,557', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,592', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '16,594', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '16,608', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '16,701', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '16,919', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '16,920', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '16,921', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.4, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '16,922', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '16,944', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '16,956', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.4, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '16,956', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '16,956', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '16,995', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '16,995', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '17,052', 'INFO', 'create_model_container', '6']\n", - "['2020-07-31 08', '45', '17,052', 'INFO', 'master_model_container', '6']\n", - "['2020-07-31 08', '45', '17,053', 'INFO', 'display_container', '7']\n", - "['2020-07-31 08', '45', '17,053', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.4, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '17,053', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '17,072', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '17,072', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '17,073', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '17,074', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '17,078', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '17,079', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '17,083', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '17,087', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,160', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,160', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,160', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,198', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '17,207', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,292', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,296', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,296', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,323', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '17,333', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,428', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,432', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,432', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,465', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '17,474', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,575', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,578', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,579', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,610', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '17,618', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,703', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,707', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,707', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,738', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '17,744', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,830', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,834', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,834', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,865', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '17,873', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,945', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,961', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,961', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,992', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '18,001', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '18,090', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '18,094', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '18,094', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '18,128', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '18,140', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '18,227', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '18,232', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '18,232', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '18,268', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '18,276', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '18,360', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '18,364', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '18,365', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '18,399', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '18,401', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '18,414', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '18,521', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '18,779', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '18,779', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '18,779', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.5, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '18,779', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '18,795', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '18,811', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.5, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '18,811', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '18,811', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '18,857', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '18,857', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', 'create_model_container', '7']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', 'master_model_container', '7']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', 'display_container', '8']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.5, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '18,934', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '18,935', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '18,935', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '18,936', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '18,940', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '18,941', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '18,946', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '18,951', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,042', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,046', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,047', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,076', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '19,087', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,162', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,162', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,205', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '19,214', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,296', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,296', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,296', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,330', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '19,339', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,424', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,428', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,428', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,458', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '19,467', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,578', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,578', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,578', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,618', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '19,628', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,716', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,720', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,720', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,752', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '19,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,843', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,847', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,848', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,881', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '19,890', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,986', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,990', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,990', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '20,023', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '20,032', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '20,122', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '20,126', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '20,126', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '20,163', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '20,172', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '20,246', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '20,246', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '20,246', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '20,292', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '20,294', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '20,309', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '20,394', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '20,611', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '20,612', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '20,613', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.6, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '20,613', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '20,630', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '20,645', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.6, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '20,645', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '20,645', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '20,692', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '20,692', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '20,742', 'INFO', 'create_model_container', '8']\n", - "['2020-07-31 08', '45', '20,742', 'INFO', 'master_model_container', '8']\n", - "['2020-07-31 08', '45', '20,742', 'INFO', 'display_container', '9']\n", - "['2020-07-31 08', '45', '20,743', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.6, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '20,743', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '20,760', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '20,760', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '20,761', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '20,761', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '20,765', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '20,766', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '20,770', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '20,777', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '20,846', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '20,846', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '20,846', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '20,888', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '20,897', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '20,996', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '20,996', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '20,996', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,041', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '21,051', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,146', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,162', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,200', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '21,215', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,297', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,313', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,313', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,346', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '21,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,450', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,454', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,454', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,485', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '21,497', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,597', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,601', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,601', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,634', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '21,643', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,742', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,747', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,747', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,782', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '21,795', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,879', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,879', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,879', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,924', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '21,934', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '22,027', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '22,043', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '22,043', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '22,084', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '22,093', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '22,195', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '22,195', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '22,195', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '22,245', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '22,248', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '22,266', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '22,362', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '22,584', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '22,584', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '22,586', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.7000000000000001,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '22,586', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '22,609', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '22,614', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.7000000000000001,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '22,614', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '22,614', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '22,692', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '22,692', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '22,739', 'INFO', 'create_model_container', '9']\n", - "['2020-07-31 08', '45', '22,739', 'INFO', 'master_model_container', '9']\n", - "['2020-07-31 08', '45', '22,739', 'INFO', 'display_container', '10']\n", - "['2020-07-31 08', '45', '22,743', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.7000000000000001,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0)']\n", - "['2020-07-31 08', '45', '22,743', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '22,744', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '22,748', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '22,748', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '22,748', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '22,748', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '22,799', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '22,802', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '22,803', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '22,803', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '22,812', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '22,812', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '22,827', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '22,844', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '22,930', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '22,930', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '22,930', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '22,969', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '22,979', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,064', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,064', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,064', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,098', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '23,113', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,197', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,197', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,197', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,235', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '23,244', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,330', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,331', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,331', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,365', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '23,375', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,498', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,502', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,503', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,544', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '23,554', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,660', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,664', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,664', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,699', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '23,710', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,811', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,816', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,816', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,851', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '23,861', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,947', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,947', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,947', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,987', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '23,996', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '24,081', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '24,081', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '24,081', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '24,122', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '24,132', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '24,229', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '24,229', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '24,229', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '24,271', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '24,273', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '24,288', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '24,380', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '24,596', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '24,597', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '24,598', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.8, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '24,598', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '24,614', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '24,614', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.8, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '24,629', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '24,629', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '24,660', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '24,660', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', 'create_model_container', '10']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', 'master_model_container', '10']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', 'display_container', '11']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.8, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '24,744', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '24,744', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '24,745', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '24,745', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '24,750', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '24,750', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '24,755', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '24,760', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '24,841', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '24,845', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '24,845', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '24,875', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '24,884', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '24,965', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '24,965', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '24,965', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,005', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '25,015', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,130', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,130', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,130', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,165', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '25,165', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,280', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,280', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,280', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,318', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '25,327', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,423', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,427', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,427', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,460', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '25,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,572', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,577', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,577', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,612', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '25,621', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,698', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,698', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,698', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,747', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '25,755', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,832', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,832', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,832', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,878', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '25,887', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,981', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,986', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,986', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '26,023', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '26,034', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '26,137', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '26,142', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '26,142', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '26,180', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '26,182', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '26,197', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '26,299', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '26,531', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '26,532', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '26,533', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.9, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '26,533', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '26,548', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '26,564', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.9, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '26,564', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '26,564', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '26,626', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '26,626', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '26,673', 'INFO', 'create_model_container', '11']\n", - "['2020-07-31 08', '45', '26,673', 'INFO', 'master_model_container', '11']\n", - "['2020-07-31 08', '45', '26,673', 'INFO', 'display_container', '12']\n", - "['2020-07-31 08', '45', '26,675', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.9, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '26,675', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '35,225', 'INFO', 'Initializing tune_model()']\n", - "['2020-07-31 08', '45', '35,225', 'INFO', \"tune_model(estimator=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), fold=10, round=4, n_iter=50, custom_grid=None, optimize=MAE, choose_better=False, verbose=True)']\n", - "['2020-07-31 08', '45', '35,226', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '35,226', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '35,226', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '35,246', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '35,246', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '35,247', 'INFO', 'Checking base model']\n", - "['2020-07-31 08', '45', '35,248', 'INFO', 'Base model', 'Light Gradient Boosting Machine']\n", - "['2020-07-31 08', '45', '35,249', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '35,249', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '35,255', 'INFO', 'Defining Hyperparameters']\n", - "['2020-07-31 08', '45', '35,255', 'INFO', 'Initializing RandomizedSearchCV']\n", - "['2020-07-31 08', '45', '37,358', 'INFO', 'Random search completed']\n", - "['2020-07-31 08', '45', '37,367', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '37,377', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,389', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,392', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,423', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '37,431', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,444', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,447', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,478', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '37,488', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,500', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,504', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,536', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '37,545', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,564', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,567', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,598', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '37,608', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,621', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,625', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,656', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '37,664', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,677', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,681', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,717', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '37,726', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,738', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,741', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,778', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '37,788', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,802', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,806', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,841', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '37,851', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,863', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,866', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,903', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '37,913', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,926', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,930', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,967', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '37,969', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '37,984', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '37,996', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '37,996', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '37,997', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '38,113', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '38,113', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '38,114', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.3, max_depth=70,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.2,']\n", - "['n_estimators=10, n_jobs=-1, num_leaves=10, objective=None,']\n", - "['random_state=123, reg_alpha=0.4, reg_lambda=0.1, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '38,114', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '38,121', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '38,132', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.3, max_depth=70,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.2,']\n", - "['n_estimators=10, n_jobs=-1, num_leaves=10, objective=None,']\n", - "['random_state=123, reg_alpha=0.4, reg_lambda=0.1, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '38,132', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '38,132', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '38,394', 'INFO', 'create_model_container', '12']\n", - "['2020-07-31 08', '45', '38,394', 'INFO', 'master_model_container', '12']\n", - "['2020-07-31 08', '45', '38,395', 'INFO', 'display_container', '13']\n", - "['2020-07-31 08', '45', '38,395', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.3, max_depth=70,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.2,']\n", - "['n_estimators=10, n_jobs=-1, num_leaves=10, objective=None,']\n", - "['random_state=123, reg_alpha=0.4, reg_lambda=0.1, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '38,395', 'INFO', 'tune_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '38,408', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '38,409', 'INFO', 'create_model(estimator=dt, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '38,409', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '38,409', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '38,409', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '38,428', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '38,428', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '38,429', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '38,430', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '38,435', 'INFO', 'Decision Tree Regressor Imported succesfully']\n", - "['2020-07-31 08', '45', '38,437', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '38,440', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '38,446', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,451', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,453', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,453', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,467', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '38,472', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,478', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,479', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,479', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,493', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '38,500', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,505', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,507', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,507', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,521', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '38,527', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,532', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,534', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,534', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,549', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '38,555', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,560', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,562', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,562', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,577', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '38,583', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,588', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,590', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,590', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,606', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '38,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,617', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,619', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,619', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,635', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '38,640', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,647', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,648', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,648', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,664', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '38,671', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,675', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,677', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,677', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,693', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '38,698', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,704', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,705', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,705', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,722', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '38,723', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '38,731', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '38,739', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '38,888', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '38,888', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '38,889', 'INFO', \"save_model(model=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '45', '38,889', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '38,895', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '38,900', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), None]\"]\n", - "['2020-07-31 08', '45', '38,900', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '38,901', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '38,918', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '38,918', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '38,949', 'INFO', 'create_model_container', '13']\n", - "['2020-07-31 08', '45', '38,949', 'INFO', 'master_model_container', '13']\n", - "['2020-07-31 08', '45', '38,949', 'INFO', 'display_container', '14']\n", - "['2020-07-31 08', '45', '38,950', 'INFO', \"DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')\"]\n", - "['2020-07-31 08', '45', '38,950', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '38,955', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 08', '45', '38,955', 'INFO', \"ensemble_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Bagging, fold=10, n_estimators=50, round=4, choose_better=False, optimize=R2, verbose=True)\"]\n", - "['2020-07-31 08', '45', '38,955', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '38,955', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '38,955', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '38,978', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '38,978', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '38,980', 'INFO', 'Checking base model']\n", - "['2020-07-31 08', '45', '38,981', 'INFO', 'Base model', 'Decision Tree']\n", - "['2020-07-31 08', '45', '38,985', 'INFO', 'BaggingRegressor() succesfully imported']\n", - "['2020-07-31 08', '45', '38,990', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '38,991', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '38,996', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,156', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,178', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '39,183', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,330', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,335', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,350', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '39,355', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,486', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,486', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,515', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '39,521', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,651', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,666', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,684', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '39,689', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,816', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,816', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,844', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '39,849', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,986', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,986', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,007', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '40,012', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '40,154', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '40,154', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,178', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '40,183', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '40,327', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '40,332', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,348', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '40,353', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '40,503', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '40,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,528', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '40,533', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '40,698', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '40,704', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,721', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '40,722', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '40,730', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '40,882', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '40,882', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '40,883', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '40,950', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '40,951', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '40,952', 'INFO', 'save_model(model=BaggingRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=50, n_jobs=None, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '40,952', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '40,976', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '40,981', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), BaggingRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=50, n_jobs=None, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '45', '40,981', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '40,981', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'create_model_container', '14']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'master_model_container', '14']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'display_container', '15']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'BaggingRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=50, n_jobs=None, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '41,133', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 08', '45', '41,134', 'INFO', \"ensemble_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Boosting, fold=10, n_estimators=10, round=4, choose_better=False, optimize=R2, verbose=True)\"]\n", - "['2020-07-31 08', '45', '41,134', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '41,134', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '41,134', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '41,157', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '41,157', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '41,159', 'INFO', 'Checking base model']\n", - "['2020-07-31 08', '45', '41,160', 'INFO', 'Base model', 'Decision Tree']\n", - "['2020-07-31 08', '45', '41,166', 'INFO', 'AdaBoostRegressor() succesfully imported']\n", - "['2020-07-31 08', '45', '41,172', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '41,172', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '41,179', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,212', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,214', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,228', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '41,233', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,265', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,268', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,283', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '41,288', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,322', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,325', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,339', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '41,345', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,378', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,380', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,395', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '41,399', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,443', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,445', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,460', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '41,465', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,496', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,499', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,516', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '41,521', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,555', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,557', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,573', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '41,578', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,616', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,619', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,638', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '41,644', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,686', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,690', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,707', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '41,713', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,749', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,751', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,768', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '41,768', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '41,776', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '41,814', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '41,814', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '41,814', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '41,869', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '41,869', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '41,870', 'INFO', 'save_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '41,871', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '41,878', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '41,883', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), None]']\n", - "['2020-07-31 08', '45', '41,883', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '41,883', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '42,011', 'INFO', 'create_model_container', '15']\n", - "['2020-07-31 08', '45', '42,011', 'INFO', 'master_model_container', '15']\n", - "['2020-07-31 08', '45', '42,011', 'INFO', 'display_container', '16']\n", - "['2020-07-31 08', '45', '42,012', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '45', '42,012', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'Initializing blend_models()']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'blend_models(estimator_list=All, fold=10, round=4, choose_better=False, optimize=R2, turbo=True, verbose=True)']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '42,034', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '42,034', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '42,036', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '42,036', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '42,041', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 08', '45', '42,041', 'INFO', 'Import successful']\n", - "['2020-07-31 08', '45', '42,042', 'INFO', 'Defining model names in estimator_list']\n", - "['2020-07-31 08', '45', '45,250', 'INFO', 'n_jobs multiple passed']\n", - "['2020-07-31 08', '45', '45,265', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '45,280', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '48,335', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '48,715', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '48,739', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '48,753', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '51,531', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '51,907', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '51,935', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '51,944', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '54,960', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '55,340', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '55,370', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '55,380', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '58,319', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '58,719', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '58,743', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '58,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '01,634', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '02,022', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '02,053', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '02,064', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '04,996', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '05,375', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '05,404', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '05,415', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '08,454', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '08,850', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '08,884', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '08,894', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '11,712', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '12,102', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '12,118', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '12,134', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '14,865', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '15,254', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '15,270', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '15,286', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '18,564', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '18,970', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '19,005', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '19,007', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '19,022', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '22,593', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '22,593', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '22,594', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '22,641', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '22,642', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '22,679', 'INFO', \"save_model(model=VotingRegressor(estimators=[('Linear Regression_0',\"]\n", - "['LinearRegression(copy_X=True, fit_intercept=True,']\n", - "['n_jobs=-1, normalize=False)),']\n", - "[\"('Lasso_1',\"]\n", - "['Lasso(alpha=1.0, copy_X=True, fit_intercept=True,']\n", - "['max_iter=1000, normalize=False,']\n", - "['positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic',\"]\n", - "['tol=0.0001, warm_start=False)),']\n", - "[\"('Ridge_2',\"]\n", - "['Ridge(alpha=1.0, copy_X=True...']\n", - "['min_child_samples=20,']\n", - "['min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100,']\n", - "['n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123,']\n", - "['reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0,']\n", - "['subsample_for_bin=200000,']\n", - "['subsample_freq=0)),']\n", - "[\"('CatBoost Regressor_21',\"]\n", - "[')],']\n", - "['n_jobs=-1, verbose=False, weights=None), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '22,679', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '22,831', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '22,915', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), VotingRegressor(estimators=[('Linear Regression_0',\"]\n", - "['LinearRegression(copy_X=True, fit_intercept=True,']\n", - "['n_jobs=-1, normalize=False)),']\n", - "[\"('Lasso_1',\"]\n", - "['Lasso(alpha=1.0, copy_X=True, fit_intercept=True,']\n", - "['max_iter=1000, normalize=False,']\n", - "['positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic',\"]\n", - "['tol=0.0001, warm_start=False)),']\n", - "[\"('Ridge_2',\"]\n", - "['Ridge(alpha=1.0, copy_X=True...']\n", - "['min_child_samples=20,']\n", - "['min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100,']\n", - "['n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123,']\n", - "['reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0,']\n", - "['subsample_for_bin=200000,']\n", - "['subsample_freq=0)),']\n", - "[\"('CatBoost Regressor_21',\"]\n", - "[')],']\n", - "['n_jobs=-1, verbose=False, weights=None), None]']\n", - "['2020-07-31 08', '46', '22,915', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '22,915', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '23,715', 'INFO', 'create_model_container', '16']\n", - "['2020-07-31 08', '46', '23,715', 'INFO', 'master_model_container', '16']\n", - "['2020-07-31 08', '46', '23,715', 'INFO', 'display_container', '17']\n", - "['2020-07-31 08', '46', '23,735', 'INFO', \"VotingRegressor(estimators=[('Linear Regression_0',\"]\n", - "['LinearRegression(copy_X=True, fit_intercept=True,']\n", - "['n_jobs=-1, normalize=False)),']\n", - "[\"('Lasso_1',\"]\n", - "['Lasso(alpha=1.0, copy_X=True, fit_intercept=True,']\n", - "['max_iter=1000, normalize=False,']\n", - "['positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic',\"]\n", - "['tol=0.0001, warm_start=False)),']\n", - "[\"('Ridge_2',\"]\n", - "['Ridge(alpha=1.0, copy_X=True...']\n", - "['min_child_samples=20,']\n", - "['min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100,']\n", - "['n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123,']\n", - "['reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0,']\n", - "['subsample_for_bin=200000,']\n", - "['subsample_freq=0)),']\n", - "[\"('CatBoost Regressor_21',\"]\n", - "[')],']\n", - "['n_jobs=-1, verbose=False, weights=None)']\n", - "['2020-07-31 08', '46', '23,735', 'INFO', 'blend_models() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '23,746', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 08', '46', '23,746', 'INFO', \"compare_models(blacklist=None, whitelist=['rf', 'et', 'ada', 'gbr', 'xgboost', 'lightgbm', 'catboost'], fold=5, round=4, sort=R2, n_select=5, turbo=True, verbose=True)\"]\n", - "['2020-07-31 08', '46', '23,746', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '23,746', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '23,746', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '23,764', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '23,765', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '23,770', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 08', '46', '23,771', 'INFO', 'Import successful']\n", - "['2020-07-31 08', '46', '23,777', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '23,777', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '23,777', 'INFO', 'Initializing Random Forest']\n", - "['2020-07-31 08', '46', '23,782', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '23,789', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '24,034', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '24,142', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '24,143', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '24,164', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '24,176', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '24,434', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '24,549', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '24,549', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '24,561', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '24,578', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '24,918', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '25,038', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '25,038', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '25,064', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '25,081', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '25,328', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '25,435', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '25,436', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '25,448', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '25,458', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '25,707', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '25,823', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '25,823', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '25,823', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '25,823', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '25,838', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '25,900', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '25,900', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '25,900', 'INFO', \"save_model(model=RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '25,900', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '25,932', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '25,932', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '46', '25,932', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '25,932', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '25,987', 'INFO', 'Initializing Extra Trees Regressor']\n", - "['2020-07-31 08', '46', '25,992', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '25,998', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '26,142', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '26,268', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '26,268', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '26,284', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '26,303', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '26,440', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '26,546', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '26,546', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '26,553', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '26,563', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '26,705', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '26,821', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '26,821', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '26,836', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '26,852', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,011', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,117', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,118', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,139', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '27,139', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,295', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,421', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,421', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,421', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '27,421', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '27,436', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '27,502', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '27,502', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '27,503', 'INFO', \"save_model(model=ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '27,503', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '27,523', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '27,539', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '46', '27,539', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '27,539', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '27,586', 'INFO', 'Initializing AdaBoost Regressor']\n", - "['2020-07-31 08', '46', '27,601', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '27,601', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,633', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,633', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,633', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,633', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '27,647', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,663', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,665', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,665', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,670', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '27,674', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,674', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,674', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,674', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,689', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '27,689', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,705', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '46', '27,705', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,705', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,705', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '27,721', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '27,752', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '27,799', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '27,799', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '27,799', 'INFO', \"save_model(model=AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '27,799', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '27,814', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '27,814', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", - "['n_estimators=50, random_state=123), None]']\n", - "['2020-07-31 08', '46', '27,814', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '27,814', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '27,846', 'INFO', 'Initializing Gradient Boosting Regressor']\n", - "['2020-07-31 08', '46', '27,846', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '27,861', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,924', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,924', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,924', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,939', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '27,939', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,002', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,018', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,018', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,018', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '28,018', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,174', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,174', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,174', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,174', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '28,189', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,252', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,252', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,252', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,267', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '28,267', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '28,267', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '28,330', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '28,330', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '28,330', 'INFO', \"save_model(model=GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '28,330', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '28,346', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '28,346', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '46', '28,346', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '28,346', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '28,408', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 08', '46', '28,408', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '28,424', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,471', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,471', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,471', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,486', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '28,502', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,549', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,549', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,549', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,564', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '28,580', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,611', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,611', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,611', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,627', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '28,642', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,689', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,689', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,689', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,705', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '28,720', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,767', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,783', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,783', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,799', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '28,799', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '28,830', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '28,939', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '28,939', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '28,939', 'INFO', \"save_model(model=XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '28,939', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '28,955', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '28,955', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), None]']\n", - "['2020-07-31 08', '46', '28,955', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '28,955', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '29,017', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 08', '46', '29,017', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '29,033', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,127', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,127', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,127', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,142', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '29,158', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,252', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,267', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,267', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,283', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '29,283', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,392', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,392', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,392', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,423', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '29,423', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,533', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,533', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,533', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,548', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '29,564', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,658', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,673', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,673', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,689', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '29,689', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '29,720', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '29,830', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '29,830', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '29,830', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '29,830', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '29,861', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '29,876', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '46', '29,876', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '29,876', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '29,970', 'INFO', 'Initializing CatBoost Regressor']\n", - "['2020-07-31 08', '46', '29,970', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '29,986', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '31,376', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '31,392', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '31,392', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '31,392', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '31,407', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '32,847', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '32,863', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '32,863', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '32,863', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '32,878', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '34,175', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '34,175', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '34,175', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '34,190', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '34,190', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '35,582', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '35,582', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '35,582', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '35,582', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '35,598', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,028', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,028', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '37,028', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,043', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '37,043', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '37,059', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '37,121', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '37,121', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '37,121', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '37,121', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '37,137', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '37,137', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), , None]']\n", - "['2020-07-31 08', '46', '37,137', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '37,137', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '37,184', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 08', '46', '37,184', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'create_model(estimator=xgboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Extreme Gradient Boosting Regressor Imported succesfully']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,246', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,246', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,246', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,262', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '37,262', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,309', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,309', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,309', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,325', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '37,325', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,371', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,371', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,371', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,387', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '37,387', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,434', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,434', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,434', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,449', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '37,449', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,496', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,496', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,496', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,512', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '37,512', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,559', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,559', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,559', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,574', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '37,590', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,621', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,637', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,637', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,653', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '37,653', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,699', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,699', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,699', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,715', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '37,715', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,762', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,762', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,762', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,778', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '37,778', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,840', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,840', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,856', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '37,856', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '37,871', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'create_model_container', '17']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'master_model_container', '17']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'display_container', '18']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', \"XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'create_model(estimator=gbr, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Gradient Boosting Regressor Imported succesfully']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,324', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,324', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,324', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,340', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '38,340', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,418', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,418', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,418', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,434', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '38,434', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,590', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,590', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,590', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,605', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '38,605', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '38,933', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'create_model_container', '18']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'master_model_container', '18']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'display_container', '19']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', \"GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False)']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'create_model(estimator=catboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'CatBoost Regressor Imported succesfully']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '41,620', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '41,620', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '41,620', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '41,636', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '41,636', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '42,979', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '42,995', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '42,995', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '42,995', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '42,995', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '45,653', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '45,653', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '45,653', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '45,669', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '45,669', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '47,181', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '47,181', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '47,181', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '47,197', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '47,197', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '48,509', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '48,509', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '48,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '48,524', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '48,524', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '49,928', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '49,939', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '49,940', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '49,953', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '49,955', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '51,527', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '51,530', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '51,530', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '51,540', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '51,542', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '53,254', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '53,260', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '53,260', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '53,270', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '53,272', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '53,276', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '54,768', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '54,768', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '54,768', 'INFO', 'create_model_container', '19']\n", - "['2020-07-31 08', '46', '54,769', 'INFO', 'master_model_container', '19']\n", - "['2020-07-31 08', '46', '54,769', 'INFO', 'display_container', '20']\n", - "['2020-07-31 08', '46', '54,769', 'INFO', '']\n", - "['2020-07-31 08', '46', '54,769', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'create_model(estimator=rf, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '54,786', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '54,787', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '54,787', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '54,788', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '54,788', 'INFO', 'Random Forest Regressor Imported succesfully']\n", - "['2020-07-31 08', '46', '54,789', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '54,790', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '54,792', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '55,056', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '55,173', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '55,173', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '55,183', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '55,185', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '55,444', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '55,568', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '55,568', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '55,568', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '55,568', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '55,811', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '55,932', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '55,932', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '55,932', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '55,932', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '56,191', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '56,303', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '56,303', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '56,310', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '56,311', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '56,564', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '56,678', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '56,678', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '56,684', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '56,685', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '56,948', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '57,053', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '57,055', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '57,066', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '57,066', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '57,232', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '57,338', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '57,338', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '57,348', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '57,349', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '57,609', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '57,724', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '57,724', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '57,726', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '57,740', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '57,980', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '58,097', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '58,097', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '58,097', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '58,097', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '58,350', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '58,456', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '58,456', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '58,464', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '58,465', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '58,469', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'create_model_container', '20']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'master_model_container', '20']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'display_container', '21']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', \"RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '58,766', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '58,767', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '58,768', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '58,768', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '58,768', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '46', '58,769', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '58,770', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '58,772', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '58,848', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '58,848', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '58,848', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '58,864', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '58,864', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '58,926', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '58,942', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '58,942', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '58,942', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '58,958', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,037', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,041', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,041', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,053', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '59,055', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,148', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,152', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,153', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,164', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '59,166', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,250', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,250', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,250', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,265', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '59,265', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,359', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,375', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,375', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,375', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '59,390', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,492', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,497', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,497', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,510', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '59,513', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,629', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,634', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,634', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,649', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '59,652', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,760', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,765', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,765', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,778', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '59,780', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,935', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,941', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,941', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,956', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '59,959', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '59,969', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '47', '00,131', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '47', '00,131', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '47', '00,131', 'INFO', 'create_model_container', '21']\n", - "['2020-07-31 08', '47', '00,132', 'INFO', 'master_model_container', '21']\n", - "['2020-07-31 08', '47', '00,132', 'INFO', 'display_container', '22']\n", - "['2020-07-31 08', '47', '00,133', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '47', '00,133', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '00,133', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 08', '47', '00,231', 'INFO', 'create_model_container', '21']\n", - "['2020-07-31 08', '47', '00,231', 'INFO', 'master_model_container', '21']\n", - "['2020-07-31 08', '47', '00,231', 'INFO', 'display_container', '23']\n", - "['2020-07-31 08', '47', '00,233', 'INFO', \"[XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)]']\n", - "['2020-07-31 08', '47', '00,233', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '00,241', 'INFO', 'Initializing stack_models()']\n", - "['2020-07-31 08', '47', '00,243', 'INFO', \"stack_models(estimator_list=[XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)], meta_model=None, fold=10, round=4, restack=True, plot=False, choose_better=False, optimize=R2, finalize=False, verbose=True)']\n", - "['2020-07-31 08', '47', '00,243', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '00,243', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '00,243', 'INFO', 'Copying estimator list']\n", - "['2020-07-31 08', '47', '00,296', 'INFO', 'Defining meta model']\n", - "['2020-07-31 08', '47', '00,299', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '00,346', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '00,348', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '47', '00,349', 'INFO', 'Getting model names']\n", - "['2020-07-31 08', '47', '00,356', 'INFO', 'Checking base model', 'XGBRegressor']\n", - "['2020-07-31 08', '47', '00,367', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '00,435', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '01,084', 'INFO', 'Checking base model', 'GradientBoostingRegressor']\n", - "['2020-07-31 08', '47', '01,096', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '01,257', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '02,082', 'INFO', 'Checking base model', 'CatBoostRegressor']\n", - "['2020-07-31 08', '47', '02,097', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '03,663', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '24,424', 'INFO', 'Checking base model', 'RandomForestRegressor']\n", - "['2020-07-31 08', '47', '24,430', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '24,814', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '28,106', 'INFO', 'Checking base model', 'LGBMRegressor']\n", - "['2020-07-31 08', '47', '28,120', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '28,227', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '29,899', 'INFO', 'Base layer complete']\n", - "['2020-07-31 08', '47', '29,916', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '47', '29,919', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '47', '29,935', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '29,942', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '29,948', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '29,990', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '47', '29,999', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,006', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,031', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '47', '30,044', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,052', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,057', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,089', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '47', '30,101', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,108', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,112', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,141', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '47', '30,153', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,158', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,163', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,190', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '47', '30,200', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,206', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,208', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,237', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '47', '30,247', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,253', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,255', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,280', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '47', '30,289', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,296', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,300', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,321', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '47', '30,330', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,335', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,338', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,369', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '47', '30,380', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,387', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,390', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,419', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '47', '30,420', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '47', '30,429', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '47', '30,430', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '47', '30,431', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '47', '30,542', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '30,542', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '30,547', 'INFO', \"save_model(model=[XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), True], model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '47', '30,547', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '30,631', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '30,651', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), [XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), True], None]']\n", - "['2020-07-31 08', '47', '30,652', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '30,652', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '31,205', 'INFO', 'create_model_container', '22']\n", - "['2020-07-31 08', '47', '31,205', 'INFO', 'master_model_container', '22']\n", - "['2020-07-31 08', '47', '31,205', 'INFO', 'display_container', '24']\n", - "['2020-07-31 08', '47', '31,209', 'INFO', \"[XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), True]']\n", - "['2020-07-31 08', '47', '31,209', 'INFO', 'stack_models() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '31,222', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '31,223', 'INFO', \"plot_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), plot=residuals, save=False, verbose=True, system=True)\"]\n", - "['2020-07-31 08', '47', '31,223', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '31,224', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '31,224', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '31,239', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '31,240', 'INFO', 'plot type', 'residuals']\n", - "['2020-07-31 08', '47', '31,385', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '31,427', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 08', '47', '32,278', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '32,279', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '32,288', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '32,289', 'INFO', \"plot_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), plot=error, save=False, verbose=True, system=True)\"]\n", - "['2020-07-31 08', '47', '32,289', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '32,289', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '32,290', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '32,300', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '32,301', 'INFO', 'plot type', 'error']\n", - "['2020-07-31 08', '47', '32,302', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '32,303', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 08', '47', '32,533', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '32,533', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '32,540', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '32,541', 'INFO', \"plot_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), plot=feature, save=False, verbose=True, system=True)\"]\n", - "['2020-07-31 08', '47', '32,541', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '32,541', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '32,541', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '32,551', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '32,552', 'INFO', 'plot type', 'feature']\n", - "['2020-07-31 08', '47', '32,696', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '32,697', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '32,721', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '32,722', 'INFO', \"plot_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), plot=parameter, save=False, verbose=True, system=True)\"]\n", - "['2020-07-31 08', '47', '32,722', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '32,722', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '32,722', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '32,731', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '32,732', 'INFO', 'plot type', 'parameter']\n", - "['2020-07-31 08', '47', '32,740', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '32,740', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '32,751', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 08', '47', '32,752', 'INFO', \"interpret_model(estimator=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), plot=summary, feature=None, observation=None)']\n", - "['2020-07-31 08', '47', '32,752', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '32,946', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '32,946', 'INFO', 'plot type', 'summary']\n", - "['2020-07-31 08', '47', '32,946', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 08', '47', '33,221', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 08', '47', '33,761', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '33,761', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '33,767', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 08', '47', '33,768', 'INFO', \"interpret_model(estimator=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), plot=correlation, feature=None, observation=None)']\n", - "['2020-07-31 08', '47', '33,768', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '33,769', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '33,769', 'INFO', 'plot type', 'correlation']\n", - "['2020-07-31 08', '47', '33,769', 'WARNING', 'No feature passed. Default value of feature used for correlation plot', 'age']\n", - "['2020-07-31 08', '47', '33,769', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 08', '47', '34,080', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 08', '47', '34,387', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '34,387', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '34,395', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 08', '47', '34,396', 'INFO', \"interpret_model(estimator=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), plot=reason, feature=None, observation=12)']\n", - "['2020-07-31 08', '47', '34,396', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '34,397', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '34,397', 'INFO', 'plot type', 'reason']\n", - "['2020-07-31 08', '47', '34,398', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 08', '47', '34,661', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 08', '47', '34,753', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '34,754', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '34,811', 'INFO', 'Initializing automl()']\n", - "['2020-07-31 08', '47', '34,812', 'INFO', 'automl(optimize=MAE, use_holdout=False)']\n", - "['2020-07-31 08', '47', '34,812', 'INFO', 'Model Selection Basis', 'CV Results on Training set']\n", - "['2020-07-31 08', '47', '34,820', 'INFO', 'SubProcess finalize_model() called ==================================']\n", - "['2020-07-31 08', '47', '34,821', 'INFO', 'Initializing finalize_model()']\n", - "['2020-07-31 08', '47', '34,822', 'INFO', 'finalize_model(estimator=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123))']\n", - "['2020-07-31 08', '47', '34,822', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '34,822', 'INFO', 'Getting model name']\n", - "['2020-07-31 08', '47', '34,823', 'INFO', 'Finalizing AdaBoost Regressor']\n", - "['2020-07-31 08', '47', '34,883', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '47', '34,935', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 08', '47', '34,936', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '47', '34,937', 'INFO', 'create_model(estimator=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '47', '34,937', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '34,937', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '34,937', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '34,953', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '47', '34,954', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '34,954', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '47', '34,954', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '47', '34,955', 'INFO', 'Declaring custom model']\n", - "['2020-07-31 08', '47', '34,956', 'INFO', 'AdaBoost Regressor Imported succesfully']\n", - "['2020-07-31 08', '47', '34,957', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '47', '34,958', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '47', '34,961', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,005', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,008', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,015', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '47', '35,016', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,074', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,078', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,079', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,088', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '47', '35,089', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,141', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,145', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,146', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,153', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '47', '35,154', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,201', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,204', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,204', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,211', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '47', '35,213', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,259', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,262', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,262', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,269', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '47', '35,270', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,312', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,316', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,316', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,322', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '47', '35,324', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,365', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,369', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,369', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,375', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '47', '35,376', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,417', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,420', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,420', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,426', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '47', '35,427', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,468', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,471', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,471', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,477', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '47', '35,478', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,518', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,521', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,521', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,527', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '47', '35,528', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '47', '35,532', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'create_model_container', '23']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'master_model_container', '23']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'display_container', '25']\n", - "['2020-07-31 08', '47', '35,576', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '47', '35,576', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '35,576', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 08', '47', '35,635', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '35,636', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '35,637', 'INFO', 'save_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '47', '35,637', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '35,647', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '35,653', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), None]']\n", - "['2020-07-31 08', '47', '35,653', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '35,653', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '35,712', 'INFO', 'create_model_container', '23']\n", - "['2020-07-31 08', '47', '35,712', 'INFO', 'master_model_container', '23']\n", - "['2020-07-31 08', '47', '35,712', 'INFO', 'display_container', '25']\n", - "['2020-07-31 08', '47', '35,713', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '47', '35,713', 'INFO', 'finalize_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '35,713', 'INFO', 'SubProcess finalize_model() end ==================================']\n", - "['2020-07-31 08', '47', '35,714', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '47', '35,715', 'INFO', 'automl() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '35,914', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '35,916', 'INFO', 'save_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), model_name=best-model, verbose=True)']\n", - "['2020-07-31 08', '47', '35,916', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '35,932', 'INFO', 'best-model.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '35,942', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), None]']\n", - "['2020-07-31 08', '47', '35,942', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '36,014', 'INFO', 'Initializing deploy_model()']\n", - "['2020-07-31 08', '47', '36,016', 'INFO', 'deploy_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "[\"random_state=123), model_name=best-aws, authentication={'bucket'\", \"'pycaret-test'}, platform=aws)\"]\n", - "['2020-07-31 08', '47', '36,019', 'INFO', 'Platform', 'AWS S3']\n", - "['2020-07-31 08', '47', '36,202', 'INFO', 'Saving model in active working directory']\n", - "['2020-07-31 08', '47', '36,202', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '36,203', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '36,204', 'INFO', 'save_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), model_name=best-aws, verbose=False)']\n", - "['2020-07-31 08', '47', '36,204', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '36,214', 'INFO', 'best-aws.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '36,220', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), None]']\n", - "['2020-07-31 08', '47', '36,220', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '36,220', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '36,220', 'INFO', 'Initializing S3 client']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'PyCaret Clustering Module']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'version 2.0']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'Initializing setup()']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'USI', '872d']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'setup(data=(224, 21), categorical_features=None, categorical_imputation=constant, ordinal_features=None, high_cardinality_features=None,']\n", - "[\"numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=['Country Name'], normalize=False,\"]\n", - "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", - "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None,']\n", - "['remove_multicollinearity=False, multicollinearity_threshold=0.9, group_features=None,']\n", - "['group_names=None, supervised=False, supervised_target=None, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", - "['experiment_name=health1, log_plots=True, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'Checking environment']\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'python_version', '3.7.4']\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'python_build', \"('default', 'Aug 9 2019 18\", '34', \"13')\"]\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'machine', 'AMD64']\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'Memory', 'svmem(total=17032478720, available=10622828544, percent=37.6, used=6409650176, free=10622828544)']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'Physical Core', '4']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'Logical Core', '8']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'Checking libraries']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'pd==1.0.5']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'numpy==1.18.5']\n", - "['2020-07-31 08', '47', '37,218', 'INFO', 'sklearn==0.23.1']\n", - "['2020-07-31 08', '47', '37,223', 'INFO', 'kmodes==0.10.1']\n", - "['2020-07-31 08', '47', '37,758', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '47', '37,758', 'INFO', 'deploy_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '37,765', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '47', '37,765', 'INFO', 'get_config(variable=X_train)']\n", - "['2020-07-31 08', '47', '37,765', 'INFO', 'Global variable', 'X_train returned']\n", - "['2020-07-31 08', '47', '37,765', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '37,788', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '47', '37,788', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 08', '47', '37,788', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 08', '47', '37,788', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '37,795', 'INFO', 'Initializing set_config()']\n", - "['2020-07-31 08', '47', '37,795', 'INFO', 'set_config(variable=seed, value=999)']\n", - "['2020-07-31 08', '47', '37,795', 'INFO', 'Global variable', 'seed updated']\n", - "['2020-07-31 08', '47', '37,796', 'INFO', 'set_config() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '37,801', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '47', '37,801', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 08', '47', '37,801', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 08', '47', '37,801', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '38,740', 'INFO', 'mlflow==1.8.0']\n", - "['2020-07-31 08', '47', '38,741', 'INFO', 'Checking Exceptions']\n", - "['2020-07-31 08', '47', '38,741', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '38,741', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '38,760', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '38,761', 'INFO', 'Declaring global variables']\n", - "['2020-07-31 08', '47', '38,761', 'INFO', 'Copying data for preprocessing']\n", - "['2020-07-31 08', '47', '38,767', 'INFO', 'Declaring preprocessing parameters']\n", - "['2020-07-31 08', '47', '38,767', 'INFO', 'Importing preprocessing module']\n", - "['2020-07-31 08', '47', '40,016', 'INFO', 'Creating preprocessing pipeline']\n", - "['2020-07-31 08', '47', '40,955', 'INFO', 'Preprocessing pipeline created successfully']\n", - "['2020-07-31 08', '47', '40,955', 'INFO', 'Creating grid variables']\n", - "['2020-07-31 08', '47', '40,957', 'INFO', 'Creating global containers']\n", - "['2020-07-31 08', '47', '41,398', 'INFO', 'Logging experiment in MLFlow']\n", - "['2020-07-31 08', '47', '41,542', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '41,543', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '41,555', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", - "['2020-07-31 08', '47', '41,555', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '41,565', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '41,580', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "['verbose=False), Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "['verbose=False)]']\n", - "['2020-07-31 08', '47', '41,580', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '41,580', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '41,699', 'INFO', 'Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "['verbose=False)']\n", - "['2020-07-31 08', '47', '41,699', 'INFO', 'setup() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '41,768', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '47', '41,768', 'INFO', 'create_model(model=kmeans, num_clusters=4, ground_truth=None, verbose=True, system=True)']\n", - "['2020-07-31 08', '47', '41,769', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '41,769', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '41,769', 'INFO', 'Setting num_cluster param']\n", - "['2020-07-31 08', '47', '41,769', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '41,790', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 08', '47', '41,790', 'INFO', 'K-Means Clustering Imported succesfully']\n", - "['2020-07-31 08', '47', '41,796', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '41,892', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '41,915', 'INFO', 'Creating Metrics dataframe']\n", - "['2020-07-31 08', '47', '41,917', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '47', '42,047', 'INFO', 'SubProcess plot_model() called ==================================']\n", - "['2020-07-31 08', '47', '42,047', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '42,048', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=cluster, feature=None, label=False, save=True, system=False)']\n", - "['2020-07-31 08', '47', '42,048', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '42,048', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '43,583', 'INFO', 'plot type', 'cluster']\n", - "['2020-07-31 08', '47', '43,583', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '47', '43,584', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '47', '43,584', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", - "['2020-07-31 08', '47', '43,585', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '43,585', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '43,585', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '47', '43,585', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", - "['2020-07-31 08', '47', '43,585', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '43,602', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '47', '43,603', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '47', '43,603', 'INFO', '(224, 21)']\n", - "['2020-07-31 08', '47', '43,603', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '43,603', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '47', '43,612', 'INFO', 'Fitting PCA()']\n", - "['2020-07-31 08', '47', '43,620', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '47', '43,623', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '47', '47,566', 'INFO', \"Saving 'Cluster.html' in current active directory\"]\n", - "['2020-07-31 08', '47', '47,566', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '47,566', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '47,921', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '47,921', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=distribution, feature=None, label=False, save=True, system=False)']\n", - "['2020-07-31 08', '47', '47,921', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '47,921', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '47,932', 'INFO', 'plot type', 'distribution']\n", - "['2020-07-31 08', '47', '47,932', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '47', '47,932', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '47', '47,933', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=False, verbose=False)']\n", - "['2020-07-31 08', '47', '47,933', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '47,933', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '47,933', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '47', '47,933', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '47,946', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '47', '47,946', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '47', '47,946', 'INFO', '(224, 22)']\n", - "['2020-07-31 08', '47', '47,947', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '47,947', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '47', '47,947', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '47', '47,953', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '47', '48,750', 'INFO', \"Saving 'Distribution.html' in current active directory\"]\n", - "['2020-07-31 08', '47', '48,750', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '48,750', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '49,086', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '49,087', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=elbow, feature=None, label=False, save=True, system=False)']\n", - "['2020-07-31 08', '47', '49,087', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '49,087', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '49,099', 'INFO', 'plot type', 'elbow']\n", - "['2020-07-31 08', '47', '49,361', 'INFO', 'Fitting KElbowVisualizer()']\n", - "['2020-07-31 08', '47', '49,949', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '47', '50,717', 'INFO', \"Saving 'Elbow.png' in current active directory\"]\n", - "['2020-07-31 08', '47', '50,717', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '50,717', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '50,729', 'INFO', 'SubProcess plot_model() end ==================================']\n", - "['2020-07-31 08', '47', '50,730', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '50,730', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '50,731', 'INFO', \"save_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '47', '50,731', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '50,737', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '50,744', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "[\"verbose=False), KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0)]']\n", - "['2020-07-31 08', '47', '50,744', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '50,744', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '50,783', 'INFO', \"KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0)']\n", - "['2020-07-31 08', '47', '50,784', 'INFO', 'create_models() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '50,796', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '47', '50,796', 'INFO', 'create_model(model=kmodes, num_clusters=4, ground_truth=None, verbose=True, system=True)']\n", - "['2020-07-31 08', '47', '50,796', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '50,797', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '50,797', 'INFO', 'Setting num_cluster param']\n", - "['2020-07-31 08', '47', '50,797', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '50,827', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 08', '47', '50,834', 'INFO', 'K-Modes Clustering Imported succesfully']\n", - "['2020-07-31 08', '47', '50,842', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '52,734', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '52,751', 'INFO', 'Creating Metrics dataframe']\n", - "['2020-07-31 08', '47', '52,753', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '47', '52,890', 'INFO', 'SubProcess plot_model() called ==================================']\n", - "['2020-07-31 08', '47', '52,891', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '52,891', 'INFO', \"plot_model(model=KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0), plot=cluster, feature=None, label=False, save=True, system=False)']\n", - "['2020-07-31 08', '47', '52,892', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '52,892', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '52,905', 'INFO', 'plot type', 'cluster']\n", - "['2020-07-31 08', '47', '52,905', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '47', '52,906', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '47', '52,907', 'INFO', \"assign_model(model=KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0), transformation=True, verbose=False)']\n", - "['2020-07-31 08', '47', '52,907', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '52,907', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '52,907', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '47', '52,908', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", - "['2020-07-31 08', '47', '52,908', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '52,926', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '47', '52,927', 'INFO', 'Trained Model', 'K-Modes Clustering']\n", - "['2020-07-31 08', '47', '52,927', 'INFO', '(224, 21)']\n", - "['2020-07-31 08', '47', '52,927', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '52,928', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '47', '52,935', 'INFO', 'Fitting PCA()']\n", - "['2020-07-31 08', '47', '52,945', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '47', '52,949', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '47', '53,559', 'INFO', \"Saving 'Cluster.html' in current active directory\"]\n", - "['2020-07-31 08', '47', '53,559', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '53,559', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '53,925', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '53,926', 'INFO', \"plot_model(model=KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0), plot=distribution, feature=None, label=False, save=True, system=False)']\n", - "['2020-07-31 08', '47', '53,926', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '53,926', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '53,939', 'INFO', 'plot type', 'distribution']\n", - "['2020-07-31 08', '47', '53,939', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '47', '53,939', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '47', '53,940', 'INFO', \"assign_model(model=KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0), transformation=False, verbose=False)']\n", - "['2020-07-31 08', '47', '53,940', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '53,940', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '53,940', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '47', '53,940', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '53,958', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '47', '53,959', 'INFO', 'Trained Model', 'K-Modes Clustering']\n", - "['2020-07-31 08', '47', '53,959', 'INFO', '(224, 22)']\n", - "['2020-07-31 08', '47', '53,959', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '53,959', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '47', '53,960', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '47', '53,967', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '47', '54,761', 'INFO', \"Saving 'Distribution.html' in current active directory\"]\n", - "['2020-07-31 08', '47', '54,761', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '54,761', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '55,112', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '55,113', 'INFO', \"plot_model(model=KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0), plot=elbow, feature=None, label=False, save=True, system=False)']\n", - "['2020-07-31 08', '47', '55,113', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '55,113', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '55,125', 'INFO', 'plot type', 'elbow']\n", - "['2020-07-31 08', '47', '55,145', 'INFO', 'Fitting KElbowVisualizer()']\n", - "['2020-07-31 08', '48', '00,303', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '00,447', 'INFO', \"Saving 'Elbow.png' in current active directory\"]\n", - "['2020-07-31 08', '48', '00,447', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '00,447', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '00,458', 'INFO', 'SubProcess plot_model() end ==================================']\n", - "['2020-07-31 08', '48', '00,458', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '48', '00,459', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '48', '00,459', 'INFO', \"save_model(model=KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '48', '00,459', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '48', '00,581', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '48', '00,586', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "[\"verbose=False), KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0)]']\n", - "['2020-07-31 08', '48', '00,587', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '00,587', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '48', '00,619', 'INFO', \"KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0)']\n", - "['2020-07-31 08', '48', '00,619', 'INFO', 'create_models() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '03,231', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '48', '03,231', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=False, verbose=True)']\n", - "['2020-07-31 08', '48', '03,232', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '03,232', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '48', '03,232', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '48', '03,232', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '48', '03,262', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '48', '03,262', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '48', '03,263', 'INFO', '(224, 22)']\n", - "['2020-07-31 08', '48', '03,264', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '04,898', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '04,898', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=cluster, feature=None, label=False, save=False, system=True)']\n", - "['2020-07-31 08', '48', '04,899', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '04,899', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '04,909', 'INFO', 'plot type', 'cluster']\n", - "['2020-07-31 08', '48', '04,909', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '48', '04,909', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '48', '04,910', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", - "['2020-07-31 08', '48', '04,910', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '04,910', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '48', '04,910', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '48', '04,911', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", - "['2020-07-31 08', '48', '04,911', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '48', '04,927', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '48', '04,927', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '48', '04,927', 'INFO', '(224, 21)']\n", - "['2020-07-31 08', '48', '04,927', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '04,928', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '48', '04,931', 'INFO', 'Fitting PCA()']\n", - "['2020-07-31 08', '48', '04,936', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '48', '04,938', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '05,369', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '05,369', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '07,179', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '07,180', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=cluster, feature=Country Name, label=True, save=False, system=True)']\n", - "['2020-07-31 08', '48', '07,180', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '07,180', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '07,187', 'INFO', 'plot type', 'cluster']\n", - "['2020-07-31 08', '48', '07,187', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '48', '07,188', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '48', '07,188', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", - "['2020-07-31 08', '48', '07,188', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '07,189', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '48', '07,189', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '48', '07,189', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", - "['2020-07-31 08', '48', '07,189', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '48', '07,199', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '48', '07,200', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '48', '07,200', 'INFO', '(224, 21)']\n", - "['2020-07-31 08', '48', '07,200', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '07,200', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '48', '07,204', 'INFO', 'Fitting PCA()']\n", - "['2020-07-31 08', '48', '07,207', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '48', '07,209', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '07,466', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '07,466', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '08,323', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '08,324', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=tsne, feature=None, label=False, save=False, system=True)']\n", - "['2020-07-31 08', '48', '08,324', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '08,324', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '08,334', 'INFO', 'plot type', 'tsne']\n", - "['2020-07-31 08', '48', '08,334', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '48', '08,334', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '48', '08,335', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", - "['2020-07-31 08', '48', '08,335', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '08,335', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '48', '08,335', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '48', '08,335', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", - "['2020-07-31 08', '48', '08,335', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '48', '08,343', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '48', '08,344', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '48', '08,344', 'INFO', '(224, 21)']\n", - "['2020-07-31 08', '48', '08,344', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '08,344', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '48', '08,345', 'INFO', 'Fitting TSNE()']\n", - "['2020-07-31 08', '48', '10,591', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '48', '10,600', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '11,151', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '11,151', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '11,158', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '11,159', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=elbow, feature=None, label=False, save=False, system=True)']\n", - "['2020-07-31 08', '48', '11,159', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '11,159', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '11,168', 'INFO', 'plot type', 'elbow']\n", - "['2020-07-31 08', '48', '11,169', 'INFO', 'Fitting KElbowVisualizer()']\n", - "['2020-07-31 08', '48', '11,704', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '11,875', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '11,875', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '11,882', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '11,883', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=silhouette, feature=None, label=False, save=False, system=True)']\n", - "['2020-07-31 08', '48', '11,883', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '11,883', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '11,893', 'INFO', 'plot type', 'silhouette']\n", - "['2020-07-31 08', '48', '11,893', 'INFO', 'Fitting SilhouetteVisualizer()']\n", - "['2020-07-31 08', '48', '11,976', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '12,124', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '12,124', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '12,130', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '12,131', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=distance, feature=None, label=False, save=False, system=True)']\n", - "['2020-07-31 08', '48', '12,131', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '12,132', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '12,142', 'INFO', 'plot type', 'distance']\n", - "['2020-07-31 08', '48', '12,163', 'INFO', 'Fitting InterclusterDistance()']\n", - "['2020-07-31 08', '48', '12,187', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '12,317', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '12,317', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '12,325', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '12,325', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=distribution, feature=None, label=False, save=False, system=True)']\n", - "['2020-07-31 08', '48', '12,325', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '12,325', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '12,334', 'INFO', 'plot type', 'distribution']\n", - "['2020-07-31 08', '48', '12,335', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '48', '12,335', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '48', '12,336', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=False, verbose=False)']\n", - "['2020-07-31 08', '48', '12,336', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '12,336', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '48', '12,336', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '48', '12,336', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '48', '12,347', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '48', '12,347', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '48', '12,347', 'INFO', '(224, 22)']\n", - "['2020-07-31 08', '48', '12,347', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '12,347', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '48', '12,347', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '48', '12,351', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '12,781', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '12,781', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '16,227', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '48', '16,228', 'INFO', \"save_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), model_name=kmeans, verbose=True)']\n", - "['2020-07-31 08', '48', '16,228', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '48', '16,239', 'INFO', 'kmeans.pkl saved in current working directory']\n", - "['2020-07-31 08', '48', '16,246', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "[\"verbose=False), KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0)]']\n", - "['2020-07-31 08', '48', '16,246', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '19,081', 'INFO', 'Initializing deploy_model()']\n", - "['2020-07-31 08', '48', '19,081', 'INFO', \"deploy_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "[\"random_state=123, tol=0.0001, verbose=0), model_name=kmeans-aws, authentication={'bucket'\", \"'pycaret-test'}, platform=aws)\"]\n", - "['2020-07-31 08', '48', '19,081', 'INFO', 'Platform', 'AWS S3']\n", - "['2020-07-31 08', '48', '19,264', 'INFO', 'Saving model in current working directory']\n", - "['2020-07-31 08', '48', '19,265', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '48', '19,265', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '48', '19,265', 'INFO', \"save_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), model_name=kmeans-aws, verbose=False)']\n", - "['2020-07-31 08', '48', '19,265', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '48', '19,269', 'INFO', 'kmeans-aws.pkl saved in current working directory']\n", - "['2020-07-31 08', '48', '19,273', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "[\"verbose=False), KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0)]']\n", - "['2020-07-31 08', '48', '19,273', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '19,273', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '48', '19,273', 'INFO', 'Initializing S3 client']\n", - "['2020-07-31 08', '48', '20,241', 'INFO', \"KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0)']\n", - "['2020-07-31 08', '48', '20,242', 'INFO', 'deploy_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '20,588', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '48', '20,588', 'INFO', 'get_config(variable=X)']\n", - "['2020-07-31 08', '48', '20,589', 'INFO', 'Global variable', 'X returned']\n", - "['2020-07-31 08', '48', '20,589', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '21,288', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '48', '21,288', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 08', '48', '21,288', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 08', '48', '21,289', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '21,687', 'INFO', 'Initializing set_config()']\n", - "['2020-07-31 08', '48', '21,687', 'INFO', 'set_config(variable=seed, value=999)']\n", - "['2020-07-31 08', '48', '21,687', 'INFO', 'Global variable', 'seed updated']\n", - "['2020-07-31 08', '48', '21,687', 'INFO', 'set_config() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '22,013', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '48', '22,013', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 08', '48', '22,013', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 08', '48', '22,013', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '02,210', 'INFO', 'PyCaret Anomaly Detection Module']\n", - "['2020-07-31 08', '49', '02,210', 'INFO', 'version 2.0']\n", - "['2020-07-31 08', '49', '02,210', 'INFO', 'Initializing setup()']\n", - "['2020-07-31 08', '49', '02,210', 'INFO', 'USI', '4197']\n", - "['2020-07-31 08', '49', '02,210', 'INFO', 'setup(data=(1000, 10), categorical_features=None, categorical_imputation=constant, ordinal_features=None, high_cardinality_features=None,']\n", - "['numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=None, normalize=False,']\n", - "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", - "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None,']\n", - "['remove_multicollinearity=False, multicollinearity_threshold=0.9, group_features=None,']\n", - "['group_names=None, supervised=False, supervised_target=None, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", - "['experiment_name=anomaly1, log_plots=False, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", - "['2020-07-31 08', '49', '02,210', 'INFO', 'Checking environment']\n", - "['2020-07-31 08', '49', '02,211', 'INFO', 'python_version', '3.7.4']\n", - "['2020-07-31 08', '49', '02,211', 'INFO', 'python_build', \"('default', 'Aug 9 2019 18\", '34', \"13')\"]\n", - "['2020-07-31 08', '49', '02,211', 'INFO', 'machine', 'AMD64']\n", - "['2020-07-31 08', '49', '02,211', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", - "['2020-07-31 08', '49', '02,222', 'INFO', 'Memory', 'svmem(total=17032478720, available=9700515840, percent=43.0, used=7331962880, free=9700515840)']\n", - "['2020-07-31 08', '49', '02,222', 'INFO', 'Physical Core', '4']\n", - "['2020-07-31 08', '49', '02,222', 'INFO', 'Logical Core', '8']\n", - "['2020-07-31 08', '49', '02,222', 'INFO', 'Checking libraries']\n", - "['2020-07-31 08', '49', '02,222', 'INFO', 'pd==1.0.5']\n", - "['2020-07-31 08', '49', '02,222', 'INFO', 'numpy==1.18.5']\n", - "['2020-07-31 08', '49', '03,371', 'WARNING', 'pyod not found']\n", - "['2020-07-31 08', '49', '03,997', 'INFO', 'mlflow==1.8.0']\n", - "['2020-07-31 08', '49', '03,997', 'INFO', 'Checking Exceptions']\n", - "['2020-07-31 08', '49', '03,997', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '49', '03,997', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '49', '04,013', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '49', '04,013', 'INFO', 'Declaring global variables']\n", - "['2020-07-31 08', '49', '04,013', 'INFO', 'Copying data for preprocessing']\n", - "['2020-07-31 08', '49', '04,025', 'INFO', 'Declaring preprocessing parameters']\n", - "['2020-07-31 08', '49', '04,025', 'INFO', 'Importing preprocessing module']\n", - "['2020-07-31 08', '49', '04,304', 'INFO', 'Creating preprocessing pipeline']\n", - "['2020-07-31 08', '49', '05,209', 'INFO', 'Preprocessing pipeline created successfully']\n", - "['2020-07-31 08', '49', '05,209', 'INFO', 'Creating grid variables']\n", - "['2020-07-31 08', '49', '05,210', 'INFO', 'Creating global containers']\n", - "['2020-07-31 08', '49', '05,433', 'INFO', 'Logging experiment in MLFlow']\n", - "['2020-07-31 08', '49', '05,525', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '49', '05,526', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '49', '05,530', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", - "['2020-07-31 08', '49', '05,530', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '49', '05,531', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", - "['2020-07-31 08', '49', '05,531', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "['verbose=False), Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "['verbose=False)]']\n", - "['2020-07-31 08', '49', '05,531', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '05,531', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '49', '05,578', 'INFO', 'Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "['verbose=False)']\n", - "['2020-07-31 08', '49', '05,578', 'INFO', 'setup() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '07,799', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '49', '07,799', 'INFO', 'create_model(model=iforest, fraction=0.05, verbose=True, system=True)']\n", - "['2020-07-31 08', '49', '07,799', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '49', '07,799', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '49', '07,800', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '49', '07,820', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 08', '49', '07,820', 'INFO', 'Isolation Forest Imported succesfully']\n", - "['2020-07-31 08', '49', '07,824', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '49', '08,071', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '49', '08,127', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '49', '08,128', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '49', '08,128', 'INFO', \"save_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '49', '08,128', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '49', '08,161', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '49', '08,165', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "[\"verbose=False), IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0)]']\n", - "['2020-07-31 08', '49', '08,165', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '08,166', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '49', '08,194', 'INFO', \"IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0)']\n", - "['2020-07-31 08', '49', '08,194', 'INFO', 'create_models() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '08,621', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '49', '08,621', 'INFO', 'create_model(model=knn, fraction=0.1, verbose=True, system=True)']\n", - "['2020-07-31 08', '49', '08,621', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '49', '08,621', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '49', '08,621', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '49', '08,640', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 08', '49', '08,640', 'INFO', 'k-Nearest Neighbors Detector Imported succesfully']\n", - "['2020-07-31 08', '49', '08,644', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '49', '08,665', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '49', '08,722', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '49', '08,722', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '49', '08,722', 'INFO', \"save_model(model=KNN(algorithm='auto', contamination=0.1, leaf_size=30, method='largest',\"]\n", - "[\"metric='minkowski', metric_params=None, n_jobs=1, n_neighbors=5, p=2,\"]\n", - "['radius=1.0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '49', '08,722', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '49', '08,727', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '49', '08,731', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "[\"verbose=False), KNN(algorithm='auto', contamination=0.1, leaf_size=30, method='largest',\"]\n", - "[\"metric='minkowski', metric_params=None, n_jobs=1, n_neighbors=5, p=2,\"]\n", - "['radius=1.0)]']\n", - "['2020-07-31 08', '49', '08,731', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '08,731', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '49', '08,749', 'INFO', \"KNN(algorithm='auto', contamination=0.1, leaf_size=30, method='largest',\"]\n", - "[\"metric='minkowski', metric_params=None, n_jobs=1, n_neighbors=5, p=2,\"]\n", - "['radius=1.0)']\n", - "['2020-07-31 08', '49', '08,749', 'INFO', 'create_models() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '10,079', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '49', '10,080', 'INFO', \"assign_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0), transformation=False, score=True, verbose=True)']\n", - "['2020-07-31 08', '49', '10,080', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '49', '10,080', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '49', '10,081', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '49', '10,102', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '49', '10,102', 'INFO', 'Trained Model', 'Assigned Isolation Forest']\n", - "['2020-07-31 08', '49', '10,103', 'INFO', '(1000, 12)']\n", - "['2020-07-31 08', '49', '10,103', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '10,451', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '49', '10,451', 'INFO', \"plot_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0), plot=tsne, feature=None, save=False, system=True)']\n", - "['2020-07-31 08', '49', '10,452', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '49', '10,452', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '49', '11,185', 'INFO', 'plot type', 'tsne']\n", - "['2020-07-31 08', '49', '11,185', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '49', '11,185', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '49', '11,185', 'INFO', \"assign_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0), transformation=True, score=False, verbose=False)']\n", - "['2020-07-31 08', '49', '11,185', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '49', '11,187', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '49', '11,187', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '49', '11,196', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '49', '11,196', 'INFO', 'Trained Model', 'Assigned Isolation Forest']\n", - "['2020-07-31 08', '49', '11,196', 'INFO', '(1000, 11)']\n", - "['2020-07-31 08', '49', '11,196', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '11,196', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '49', '11,203', 'INFO', 'Getting dummies to cast categorical variables']\n", - "['2020-07-31 08', '49', '11,206', 'INFO', 'Fitting TSNE()']\n", - "['2020-07-31 08', '49', '23,129', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '49', '24,132', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '49', '24,132', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '24,145', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '49', '24,145', 'INFO', \"plot_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0), plot=umap, feature=None, save=False, system=True)']\n", - "['2020-07-31 08', '49', '24,145', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '49', '24,145', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '49', '24,152', 'INFO', 'plot type', 'umap']\n", - "['2020-07-31 08', '49', '24,153', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '49', '24,153', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '49', '24,153', 'INFO', \"assign_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0), transformation=True, score=False, verbose=False)']\n", - "['2020-07-31 08', '49', '24,153', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '49', '24,153', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '49', '24,154', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '49', '24,163', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '49', '24,164', 'INFO', 'Trained Model', 'Assigned Isolation Forest']\n", - "['2020-07-31 08', '49', '24,164', 'INFO', '(1000, 11)']\n", - "['2020-07-31 08', '49', '24,164', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '24,164', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '49', '24,168', 'INFO', 'Getting dummies to cast categorical variables']\n", - "['2020-07-31 08', '49', '26,562', 'INFO', 'Fitting UMAP()']\n", - "['2020-07-31 08', '49', '29,832', 'INFO', 'PyCaret NLP Module']\n", - "['2020-07-31 08', '49', '29,832', 'INFO', 'version 2.0']\n", - "['2020-07-31 08', '49', '29,832', 'INFO', 'Initializing setup()']\n", - "['2020-07-31 08', '49', '29,832', 'INFO', 'USI', 'a367']\n", - "['2020-07-31 08', '49', '29,832', 'INFO', 'setup(data=(6818, 7), target=en, custom_stopwords=None, html=True, session_id=123, log_experiment=True,']\n", - "['experiment_name=kiva1, log_plots=True, log_data=False, verbose=True)']\n", - "['2020-07-31 08', '49', '29,832', 'INFO', 'Checking environment']\n", - "['2020-07-31 08', '49', '29,832', 'INFO', 'python_version', '3.7.4']\n", - "['2020-07-31 08', '49', '29,832', 'INFO', 'python_build', \"('default', 'Aug 9 2019 18\", '34', \"13')\"]\n", - "['2020-07-31 08', '49', '29,832', 'INFO', 'machine', 'AMD64']\n", - "['2020-07-31 08', '49', '29,832', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", - "['2020-07-31 08', '49', '29,843', 'INFO', 'Memory', 'svmem(total=17032478720, available=9347919872, percent=45.1, used=7684558848, free=9347919872)']\n", - "['2020-07-31 08', '49', '29,843', 'INFO', 'Physical Core', '4']\n", - "['2020-07-31 08', '49', '29,843', 'INFO', 'Logical Core', '8']\n", - "['2020-07-31 08', '49', '29,843', 'INFO', 'Checking libraries']\n", - "['2020-07-31 08', '49', '29,843', 'INFO', 'pd==1.0.5']\n", - "['2020-07-31 08', '49', '29,843', 'INFO', 'numpy==1.18.5']\n", - "['2020-07-31 08', '49', '31,272', 'INFO', 'gensim==3.8.1']\n", - "['2020-07-31 08', '49', '31,774', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '49', '32,164', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '49', '32,164', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '32,371', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '49', '32,372', 'INFO', \"save_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0), model_name=iforest, verbose=True)']\n", - "['2020-07-31 08', '49', '32,372', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '49', '32,421', 'INFO', 'iforest.pkl saved in current working directory']\n", - "['2020-07-31 08', '49', '32,425', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "[\"verbose=False), IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0)]']\n", - "['2020-07-31 08', '49', '32,425', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '32,534', 'INFO', 'Initializing deploy_model()']\n", - "['2020-07-31 08', '49', '32,534', 'INFO', \"deploy_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "[\"random_state=123, verbose=0), model_name=iforest-aws, authentication={'bucket'\", \"'pycaret-test'}, platform=aws)\"]\n", - "['2020-07-31 08', '49', '32,534', 'INFO', 'Platform', 'AWS S3']\n", - "['2020-07-31 08', '49', '32,597', 'INFO', 'Saving model in current working directory']\n", - "['2020-07-31 08', '49', '32,597', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '49', '32,597', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '49', '32,597', 'INFO', \"save_model(model=IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0), model_name=iforest-aws, verbose=False)']\n", - "['2020-07-31 08', '49', '32,597', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '49', '32,644', 'INFO', 'iforest-aws.pkl saved in current working directory']\n", - "['2020-07-31 08', '49', '32,659', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "[\"verbose=False), IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0)]']\n", - "['2020-07-31 08', '49', '32,659', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '32,659', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '49', '32,659', 'INFO', 'Initializing S3 client']\n", - "['2020-07-31 08', '49', '34,328', 'INFO', \"IForest(behaviour='new', bootstrap=False, contamination=0.05,\"]\n", - "[\"max_features=1.0, max_samples='auto', n_estimators=100, n_jobs=1,\"]\n", - "['random_state=123, verbose=0)']\n", - "['2020-07-31 08', '49', '34,328', 'INFO', 'deploy_model() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '34,347', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '49', '34,349', 'INFO', 'get_config(variable=X)']\n", - "['2020-07-31 08', '49', '34,349', 'INFO', 'Global variable', 'X returned']\n", - "['2020-07-31 08', '49', '34,349', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '34,394', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '49', '34,394', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 08', '49', '34,395', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 08', '49', '34,395', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '34,404', 'INFO', 'Initializing set_config()']\n", - "['2020-07-31 08', '49', '34,404', 'INFO', 'set_config(variable=seed, value=999)']\n", - "['2020-07-31 08', '49', '34,404', 'INFO', 'Global variable', 'seed updated']\n", - "['2020-07-31 08', '49', '34,404', 'INFO', 'set_config() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '34,419', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '49', '34,419', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 08', '49', '34,419', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 08', '49', '34,419', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '49', '34,430', 'INFO', 'spacy==2.2.3']\n" - ] - } - ], - "source": [ - "get_system_logs()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# 11. MLFlow UI" + "# 10. MLFlow UI" ] }, { diff --git a/examples/PyCaret 2 Classification.ipynb b/examples/PyCaret 2 Classification.ipynb index 090a0641121cab28df37ebfc0cd3d4958dc31734..0718bb5521249096718cbe890d383055304ecd96 100644 --- a/examples/PyCaret 2 Classification.ipynb +++ b/examples/PyCaret 2 Classification.ipynb @@ -4952,3303 +4952,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "# 16. Get System Logs" - ] - }, - { - "cell_type": "code", - "execution_count": 40, - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '40', '51,509', 'INFO', 'PyCaret Classification Module']\n", - "['2020-07-31 01', '40', '51,509', 'INFO', 'version 2.0']\n", - "['2020-07-31 01', '40', '51,509', 'INFO', 'Initializing setup()']\n", - "['2020-07-31 01', '40', '51,509', 'INFO', 'USI', '1cda']\n", - "['2020-07-31 01', '40', '51,510', 'INFO', 'setup(data=(1070, 19), target=Purchase, train_size=0.7, sampling=True, sample_estimator=None, categorical_features=None, categorical_imputation=constant, ordinal_features=None,']\n", - "['high_cardinality_features=None, high_cardinality_method=frequency, numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=None, normalize=False,']\n", - "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", - "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None, remove_outliers=False, outliers_threshold=0.05,']\n", - "['remove_multicollinearity=False, multicollinearity_threshold=0.9, remove_perfect_collinearity=False, create_clusters=False, cluster_iter=20,']\n", - "['polynomial_features=False, polynomial_degree=2, trigonometry_features=False, polynomial_threshold=0.1, group_features=None,']\n", - "['group_names=None, feature_selection=False, feature_selection_threshold=0.8, feature_interaction=False, feature_ratio=False, interaction_threshold=0.01,']\n", - "['fix_imbalance=False, fix_imbalance_method=None, data_split_shuffle=True, folds_shuffle=False, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", - "['experiment_name=juice1, log_plots=False, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", - "['2020-07-31 01', '40', '51,526', 'INFO', 'Checking environment']\n", - "['2020-07-31 01', '40', '51,526', 'INFO', 'python_version', '3.7.4']\n", - "['2020-07-31 01', '40', '51,527', 'INFO', 'python_build', \"('default', 'Aug 9 2019 18\", '34', \"13')\"]\n", - "['2020-07-31 01', '40', '51,527', 'INFO', 'machine', 'AMD64']\n", - "['2020-07-31 01', '40', '51,527', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Memory', 'svmem(total=17032478720, available=12121403392, percent=28.8, used=4911075328, free=12121403392)']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Physical Core', '4']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Logical Core', '8']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Checking libraries']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'pd==1.0.5']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'numpy==1.18.5']\n", - "['2020-07-31 01', '40', '55,335', 'INFO', 'sklearn==0.23.1']\n", - "['2020-07-31 01', '40', '55,728', 'INFO', 'xgboost==0.90']\n", - "['2020-07-31 01', '40', '56,084', 'INFO', 'lightgbm==2.3.1']\n", - "['2020-07-31 01', '40', '56,736', 'INFO', 'catboost==0.20.2']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'mlflow==1.8.0']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'Checking Exceptions']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '41', '00,697', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '41', '10,136', 'INFO', 'Copying data for preprocessing']\n", - "['2020-07-31 01', '41', '10,136', 'INFO', 'Declaring global variables']\n", - "['2020-07-31 01', '41', '10,162', 'INFO', 'Declaring preprocessing parameters']\n", - "['2020-07-31 01', '41', '10,162', 'INFO', 'Importing preprocessing module']\n", - "['2020-07-31 01', '41', '14,303', 'INFO', 'Creating preprocessing pipeline']\n", - "['2020-07-31 01', '41', '16,174', 'INFO', 'Preprocessing pipeline created successfully']\n", - "['2020-07-31 01', '41', '16,174', 'INFO', 'Creating grid variables']\n", - "['2020-07-31 01', '41', '16,174', 'INFO', 'Creating global containers']\n", - "['2020-07-31 01', '41', '16,270', 'INFO', 'Logging experiment in MLFlow']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False)]']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'create_model_container 0']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'master_model_container 0']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'display_container 0']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['verbose=False)']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'setup() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '23,818', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 01', '41', '23,818', 'INFO', 'compare_models(blacklist=None, whitelist=None, fold=10, round=4, sort=Accuracy, n_select=1, turbo=True, verbose=True)']\n", - "['2020-07-31 01', '41', '23,818', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '41', '23,820', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '41', '23,820', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '41', '23,838', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '41', '23,839', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '41', '23,910', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 01', '41', '23,922', 'INFO', 'Import successful']\n", - "['2020-07-31 01', '41', '23,928', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '41', '23,928', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '41', '23,928', 'INFO', 'Initializing Logistic Regression']\n", - "['2020-07-31 01', '41', '23,934', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '23,940', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '23,996', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,003', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,007', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '24,013', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,057', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,064', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,068', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '24,073', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,111', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,118', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,122', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '24,127', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,168', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,174', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,178', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '24,182', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,224', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,230', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,235', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '24,240', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,279', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,286', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,290', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '24,296', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,338', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,345', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,349', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '24,354', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,391', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,398', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,402', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '24,407', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,447', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,453', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,457', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '24,462', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,503', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,514', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '24,514', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '24,523', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'save_model(model=LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '24,644', 'INFO', 'Initializing K Neighbors Classifier']\n", - "['2020-07-31 01', '41', '24,647', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '24,647', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,685', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,905', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,911', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '24,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,922', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,165', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,173', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '25,180', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,185', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,410', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,415', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '25,422', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,427', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,652', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,652', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '25,672', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,676', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,941', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,956', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '25,956', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,972', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,219', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '26,235', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '26,235', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '26,249', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,490', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '26,490', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '26,510', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '26,514', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,744', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '26,750', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '26,756', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '26,760', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '26,998', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,007', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '27,013', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,019', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,243', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,248', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '27,249', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '27,259', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '27,319', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '27,319', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '27,320', 'INFO', \"save_model(model=KNeighborsClassifier(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '41', '27,320', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '27,330', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '27,338', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), KNeighborsClassifier(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform')]\"]\n", - "['2020-07-31 01', '41', '27,338', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '27,338', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '27,380', 'INFO', 'Initializing Naive Bayes']\n", - "['2020-07-31 01', '41', '27,380', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '27,396', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,398', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,405', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,410', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '27,415', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,418', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,424', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,429', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '27,434', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,437', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,444', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,449', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '27,455', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,458', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,465', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,469', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '27,475', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,478', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,484', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,489', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '27,494', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,497', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,504', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,509', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '27,514', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,517', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,525', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,530', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '27,535', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,538', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,545', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,550', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '27,556', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,559', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,566', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,570', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '27,576', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,579', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,585', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,590', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '27,590', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '27,600', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'save_model(model=GaussianNB(priors=None, var_smoothing=1e-09), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), GaussianNB(priors=None, var_smoothing=1e-09)]']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '27,707', 'INFO', 'Initializing Decision Tree Classifier']\n", - "['2020-07-31 01', '41', '27,712', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '27,718', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,766', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,773', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,778', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '27,783', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,788', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,794', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,799', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '27,806', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,811', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,817', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,825', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '27,834', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,847', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,853', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '27,860', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,866', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,873', 'INFO', 'Compiling Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '27,879', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '27,886', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,891', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,899', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,904', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '27,912', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,917', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,926', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,931', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '27,938', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,944', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,951', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,957', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '27,962', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,967', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,976', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,982', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '27,987', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,993', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,000', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,006', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '28,006', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '28,017', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '28,076', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '28,076', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '28,077', 'INFO', \"save_model(model=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '41', '28,077', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '28,082', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '28,086', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')]\"]\n", - "['2020-07-31 01', '41', '28,087', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '28,087', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '28,135', 'INFO', 'Initializing SVM - Linear Kernel']\n", - "['2020-07-31 01', '41', '28,141', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '28,147', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,188', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,188', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,191', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,193', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,198', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '28,204', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,212', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,212', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,215', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,217', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,222', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '28,227', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,235', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,235', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,238', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,240', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,245', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '28,250', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,256', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,256', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,259', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,262', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,266', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '28,272', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,276', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,276', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,279', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,281', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,286', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '28,291', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,297', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,297', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,300', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,302', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,307', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '28,312', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,319', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,319', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,322', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,324', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,329', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '28,334', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,341', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,341', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,344', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,346', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,350', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '28,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,364', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,364', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,367', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,369', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,374', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '28,378', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,386', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '28,386', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,389', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,391', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,396', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '28,396', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '28,407', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '28,473', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '28,474', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '28,474', 'INFO', 'save_model(model=SGDClassifier(alpha=0.0001, average=False, class_weight=None,']\n", - "['early_stopping=False, epsilon=0.1, eta0=0.0, fit_intercept=True,']\n", - "[\"l1_ratio=0.15, learning_rate='optimal', loss='hinge',\"]\n", - "[\"max_iter=1000, n_iter_no_change=5, n_jobs=-1, penalty='l2',\"]\n", - "['power_t=0.5, random_state=123, shuffle=True, tol=0.001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '28,474', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '28,479', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '28,483', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), SGDClassifier(alpha=0.0001, average=False, class_weight=None,']\n", - "['early_stopping=False, epsilon=0.1, eta0=0.0, fit_intercept=True,']\n", - "[\"l1_ratio=0.15, learning_rate='optimal', loss='hinge',\"]\n", - "[\"max_iter=1000, n_iter_no_change=5, n_jobs=-1, penalty='l2',\"]\n", - "['power_t=0.5, random_state=123, shuffle=True, tol=0.001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False)]']\n", - "['2020-07-31 01', '41', '28,483', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '28,483', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '28,532', 'INFO', 'Initializing Ridge Classifier']\n", - "['2020-07-31 01', '41', '28,532', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '28,547', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,630', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,630', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,646', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,646', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,646', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '28,646', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,662', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,662', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,665', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,667', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,676', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '28,683', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,687', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,687', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,690', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,692', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,697', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '28,706', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,711', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,711', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,713', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,715', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,720', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '28,726', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,730', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,730', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,733', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,735', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,739', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '28,744', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,748', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,749', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,751', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,754', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,759', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '28,764', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,768', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,768', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,771', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,773', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,778', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '28,784', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,788', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,788', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,791', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,793', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,799', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '28,804', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,809', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,809', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,813', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,816', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,821', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '28,827', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,831', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,831', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,834', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,836', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,841', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '28,841', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '28,853', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '28,934', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '28,935', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '28,935', 'INFO', 'save_model(model=RidgeClassifier(alpha=1.0, class_weight=None, copy_X=True, fit_intercept=True,']\n", - "[\"max_iter=None, normalize=False, random_state=123, solver='auto',\"]\n", - "['tol=0.001), model_name=Trained Model, verbose=False)']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '28,935', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '28,940', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '28,944', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RidgeClassifier(alpha=1.0, class_weight=None, copy_X=True, fit_intercept=True,']\n", - "[\"max_iter=None, normalize=False, random_state=123, solver='auto',\"]\n", - "['tol=0.001)]']\n", - "['2020-07-31 01', '41', '28,944', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '28,944', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '28,994', 'INFO', 'Initializing Random Forest Classifier']\n", - "['2020-07-31 01', '41', '29,000', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '29,006', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '29,127', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '29,363', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '29,378', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '29,378', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '29,496', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '29,712', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '29,716', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '29,723', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '29,834', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '30,077', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '30,087', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '30,095', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '30,207', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '30,439', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '30,448', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '30,455', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '30,569', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '30,799', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '30,799', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '30,814', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '30,933', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '31,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '31,175', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '31,183', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '31,295', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '31,538', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '31,547', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '31,553', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '31,666', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '31,902', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '31,913', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '31,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,034', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,263', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,263', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '32,263', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,387', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,626', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,630', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '32,630', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '32,642', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '32,729', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '32,729', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '32,729', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '32,760', 'INFO', 'Initializing Quadratic Discriminant Analysis']\n", - "['2020-07-31 01', '41', '32,776', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '32,776', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,838', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,838', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,854', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '32,854', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,854', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,870', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,870', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '32,870', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,885', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,885', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,885', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '32,901', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,901', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,901', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,916', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '32,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,916', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,932', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,932', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '32,932', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,948', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '32,948', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,948', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '32,963', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,963', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,963', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,979', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '32,979', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,979', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,995', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,995', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '33,010', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,010', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,023', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,029', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '33,033', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,039', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,045', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,050', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '33,050', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '33,062', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'save_model(model=QuadraticDiscriminantAnalysis(priors=None, reg_param=0.0,']\n", - "['store_covariance=False, tol=0.0001), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), QuadraticDiscriminantAnalysis(priors=None, reg_param=0.0,']\n", - "['store_covariance=False, tol=0.0001)]']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '33,161', 'INFO', 'Initializing Ada Boost Classifier']\n", - "['2020-07-31 01', '41', '33,161', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '33,177', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,239', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,255', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,255', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '33,270', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,333', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,348', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,348', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '33,364', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,427', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,442', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,442', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '33,458', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,520', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,536', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,552', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '33,552', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,614', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,649', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,655', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '33,660', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,730', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,746', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,761', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '33,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,839', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,855', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,855', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '33,871', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,933', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,949', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,964', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '33,964', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,027', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,058', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,058', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '34,058', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,136', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,152', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,152', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '34,152', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '34,171', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '34,240', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '34,241', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '34,241', 'INFO', \"save_model(model=AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '34,241', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123)]']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '34,314', 'INFO', 'Initializing Gradient Boosting Classifier']\n", - "['2020-07-31 01', '41', '34,322', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '34,328', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,447', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,455', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,460', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '34,466', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,582', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '34,589', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,594', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '34,600', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,726', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,733', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,739', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '34,745', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,851', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,868', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,872', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '34,877', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,995', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,002', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,008', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '35,013', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,134', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,142', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,146', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '35,151', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,277', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,284', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,290', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '35,296', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,398', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,398', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,413', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '35,413', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,532', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,539', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,545', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '35,550', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,674', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,680', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,686', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '35,686', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '35,699', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', \"save_model(model=GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '35,814', 'INFO', 'Initializing Linear Discriminant Analysis']\n", - "['2020-07-31 01', '41', '35,832', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '35,838', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,848', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,855', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,860', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '35,865', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,873', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,880', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,885', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '35,890', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,900', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,906', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,911', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '35,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,924', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,931', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,936', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '35,941', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,949', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,956', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,960', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '35,966', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,973', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,980', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,985', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '35,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,999', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,005', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,013', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '36,021', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,031', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,037', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,043', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '36,048', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,055', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,062', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,066', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '36,071', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,079', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,086', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,091', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '36,091', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '36,103', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '36,160', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '36,160', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '36,161', 'INFO', 'save_model(model=LinearDiscriminantAnalysis(n_components=None, priors=None, shrinkage=None,']\n", - "[\"solver='svd', store_covariance=False, tol=0.0001), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '41', '36,161', 'INFO', 'Appending prep pipeline']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '36,165', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '36,168', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LinearDiscriminantAnalysis(n_components=None, priors=None, shrinkage=None,']\n", - "[\"solver='svd', store_covariance=False, tol=0.0001)]\"]\n", - "['2020-07-31 01', '41', '36,168', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '36,168', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '36,199', 'INFO', 'Initializing Extra Trees Classifier']\n", - "['2020-07-31 01', '41', '36,215', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '36,221', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,359', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,592', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,602', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '36,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,759', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,976', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,983', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '36,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '37,131', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '37,369', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '37,369', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '37,390', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '37,529', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '37,769', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '37,769', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '37,792', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '37,934', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '38,165', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '38,181', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '38,181', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '38,333', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '38,572', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '38,572', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '38,588', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '38,732', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '38,984', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '38,994', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '39,003', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '39,164', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '39,413', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '39,419', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '39,419', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '39,586', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '39,808', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '39,808', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '39,823', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '39,966', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,196', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,196', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '40,196', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '40,211', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'save_model(model=ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '40,333', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '40,349', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '40,349', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '40,349', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '40,395', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 01', '41', '40,395', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '40,410', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,501', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,517', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,532', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '40,537', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,568', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,584', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,603', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '40,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,655', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,667', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,678', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '40,687', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,727', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,740', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,751', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '40,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,800', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,813', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,820', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '40,834', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,873', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,886', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,897', 'INFO', 'Initializing Fold 7']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '40,906', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,946', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,959', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,970', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '40,980', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,020', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,032', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,043', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '41,054', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,096', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,109', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,119', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '41,128', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,175', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,188', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,199', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '41,199', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '41,228', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '41,348', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '41,349', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '41,349', 'INFO', \"save_model(model=XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '41,349', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '41,358', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '41,362', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)]']\n", - "['2020-07-31 01', '41', '41,362', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '41,362', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '41,423', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 01', '41', '41,429', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '41,434', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,515', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,533', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,544', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '41,554', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,628', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,645', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,656', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '41,665', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,734', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,737', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,753', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '41,769', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,837', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,838', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,853', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '41,873', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,936', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,937', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,953', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '41,972', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,047', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,063', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,074', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '42,084', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,180', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,196', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,208', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '42,218', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,287', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,302', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,318', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '42,318', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,380', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,412', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,412', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '42,427', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,502', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,519', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,530', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '42,531', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '42,561', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '42,651', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '42,651', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '42,652', 'INFO', \"save_model(model=LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '42,652', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '42,663', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '42,675', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)]']\n", - "['2020-07-31 01', '41', '42,675', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '42,675', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '42,777', 'INFO', 'Initializing CatBoost Classifier']\n", - "['2020-07-31 01', '41', '42,783', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '42,789', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '45,155', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '45,194', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '45,199', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '45,205', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '47,070', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '47,086', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '47,086', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '47,086', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '48,735', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '48,751', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '48,751', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '48,764', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '50,511', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '50,526', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '50,542', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '50,542', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '52,170', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '52,170', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '52,186', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '52,193', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '53,805', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '53,820', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '53,820', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '53,834', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '55,391', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '55,391', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '55,407', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '55,407', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '56,979', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '56,994', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '56,994', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '57,008', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '58,639', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '58,654', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '58,670', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '58,670', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,228', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,244', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,244', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '00,244', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '00,260', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '00,317', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '00,317', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '00,318', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '00,318', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '00,325', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '00,329', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ]']\n", - "['2020-07-31 01', '42', '00,329', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '00,329', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '00,375', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 01', '42', '00,375', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'create_model(estimator=lr, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '00,392', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '00,392', 'INFO', 'Logistic Regression Imported succesfully']\n", - "['2020-07-31 01', '42', '00,392', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '00,395', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '00,396', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,435', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,441', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,445', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '00,445', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,476', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,476', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,492', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '00,492', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,523', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,539', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,539', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '00,539', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,585', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,585', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,601', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '00,601', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,632', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,648', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,648', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '00,648', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,679', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,695', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,695', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '00,695', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Compiling Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '00,788', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,882', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,882', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,898', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '00,898', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '00,898', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'display_container', '1']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 01', '42', '00,999', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 01', '42', '00,999', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 01', '42', '01,000', 'INFO', 'display_container', '2']\n", - "['2020-07-31 01', '42', '01,000', 'INFO', 'LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '01,000', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'create_model(estimator=lr, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '01,010', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '01,033', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '01,034', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '01,035', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '01,035', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '01,039', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '01,039', 'INFO', 'Logistic Regression Imported succesfully']\n", - "['2020-07-31 01', '42', '01,040', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '01,046', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '01,050', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,094', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,101', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,113', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '01,118', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,160', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,166', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,180', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '01,185', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,230', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,236', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,248', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '01,253', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,295', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,301', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,314', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '01,322', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,368', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,374', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,378', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '01,378', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,432', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,438', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,444', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '01,444', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,497', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,503', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,511', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '01,511', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,561', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,568', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,582', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '01,587', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,626', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,633', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,646', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '01,651', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,694', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,700', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,715', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '01,716', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '01,724', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '01,766', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '01,930', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '01,931', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '01,931', 'INFO', 'save_model(model=LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '01,931', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '01,936', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '01,940', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '01,940', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '01,940', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '01,960', 'INFO', 'Uploading results into container']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '01,960', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '01,993', 'INFO', 'create_model_container', '2']\n", - "['2020-07-31 01', '42', '01,993', 'INFO', 'master_model_container', '2']\n", - "['2020-07-31 01', '42', '01,993', 'INFO', 'display_container', '3']\n", - "['2020-07-31 01', '42', '01,994', 'INFO', 'LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '01,994', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '02,000', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '02,000', 'INFO', 'create_model(estimator=dt, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '02,001', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '02,001', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '02,001', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '02,022', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '02,023', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '02,023', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '02,023', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '02,027', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '02,027', 'INFO', 'Decision Tree Classifier Imported succesfully']\n", - "['2020-07-31 01', '42', '02,028', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '02,035', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '02,040', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,046', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,054', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,069', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '02,073', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,078', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,085', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,099', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '02,104', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,108', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,115', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,133', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '02,137', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,143', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,149', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,165', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '02,170', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,174', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,181', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,198', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '02,204', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,208', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,216', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,234', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '02,239', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,244', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,252', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,268', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '02,273', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,279', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,290', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,307', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '02,313', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,318', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,326', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,342', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '02,347', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,352', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,360', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,376', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '02,377', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '02,385', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '02,390', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '02,521', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '02,521', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '02,521', 'INFO', \"save_model(model=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '42', '02,521', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '02,526', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '02,530', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')]\"]\n", - "['2020-07-31 01', '42', '02,530', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '02,530', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '02,545', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '02,545', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '02,583', 'INFO', 'create_model_container', '3']\n", - "['2020-07-31 01', '42', '02,583', 'INFO', 'master_model_container', '3']\n", - "['2020-07-31 01', '42', '02,583', 'INFO', 'display_container', '4']\n", - "['2020-07-31 01', '42', '02,584', 'INFO', \"DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')\"]\n", - "['2020-07-31 01', '42', '02,584', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '02,591', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '02,591', 'INFO', 'create_model(estimator=rf, ensemble=False, method=None, fold=5, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '02,591', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '02,592', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '02,592', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '02,613', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '02,614', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '02,615', 'INFO', 'Defining folds']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '02,615', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '02,619', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '02,620', 'INFO', 'Random Forest Classifier Imported succesfully']\n", - "['2020-07-31 01', '42', '02,620', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '02,626', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '02,631', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,758', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '03,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '03,028', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '03,034', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '03,159', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '03,378', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '03,408', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '03,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '03,526', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '03,754', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '03,773', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '03,778', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '03,894', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '04,129', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '04,146', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '04,146', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '04,276', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '04,495', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '04,517', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '04,518', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '04,524', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '04,642', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '05,065', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '05,065', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'create_model_container', '4']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'master_model_container', '4']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'display_container', '5']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '05,131', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 01', '42', '05,131', 'INFO', \"compare_models(blacklist=None, whitelist=['rf', 'ada', 'gbc', 'et', 'xgboost', 'lightgbm', 'catboost'], fold=3, round=4, sort=Accuracy, n_select=1, turbo=True, verbose=True)\"]\n", - "['2020-07-31 01', '42', '05,131', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '05,132', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '05,132', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '05,155', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '05,156', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '05,160', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 01', '42', '05,160', 'INFO', 'Import successful']\n", - "['2020-07-31 01', '42', '05,167', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '05,167', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '05,167', 'INFO', 'Initializing Random Forest Classifier']\n", - "['2020-07-31 01', '42', '05,172', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '05,179', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '05,293', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '05,535', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '05,535', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '05,550', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '05,676', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '05,894', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '05,894', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '05,910', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,026', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,258', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,258', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '06,258', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '06,273', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '06,339', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '06,339', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '06,340', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '06,340', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '06,400', 'INFO', 'Initializing Ada Boost Classifier']\n", - "['2020-07-31 01', '42', '06,405', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '06,411', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,478', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,496', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,496', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '06,496', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,575', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,581', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,596', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '06,596', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,670', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,680', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,680', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '06,680', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '06,696', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', \"save_model(model=AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123)]']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '06,825', 'INFO', 'Initializing Gradient Boosting Classifier']\n", - "['2020-07-31 01', '42', '06,825', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '06,841', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,929', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,929', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,944', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '06,944', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,030', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '07,046', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '07,046', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '07,046', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,146', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '07,146', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '07,162', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '07,162', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '07,162', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '07,241', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '07,241', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '07,242', 'INFO', \"save_model(model=GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '07,242', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '07,249', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '07,254', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '07,254', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '07,254', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '07,294', 'INFO', 'Initializing Extra Trees Classifier']\n", - "['2020-07-31 01', '42', '07,294', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '07,313', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,459', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '07,694', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '07,694', 'INFO', 'Initializing Fold 2']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '07,694', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,859', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,109', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,109', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '08,109', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,277', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,495', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,495', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '08,495', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '08,511', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'save_model(model=ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '08,705', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 01', '42', '08,721', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '08,727', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,759', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,773', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,781', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '08,794', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,828', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,842', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,853', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '08,864', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,900', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,913', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,924', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '08,925', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '08,947', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', \"save_model(model=XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)]']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '09,201', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 01', '42', '09,216', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '09,222', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '09,276', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '09,282', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '09,297', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '09,314', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '09,375', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '09,381', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '09,397', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '09,413', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '09,466', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '09,481', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '09,481', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '09,481', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '09,514', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', \"save_model(model=LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '09,613', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '09,628', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)]']\n", - "['2020-07-31 01', '42', '09,628', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '09,628', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '09,722', 'INFO', 'Initializing CatBoost Classifier']\n", - "['2020-07-31 01', '42', '09,733', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '09,738', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '11,485', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '11,485', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '11,501', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '11,508', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '13,655', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '13,671', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '13,671', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '13,686', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '15,832', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '15,844', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '15,851', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '15,851', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '15,867', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '15,935', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '15,936', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '15,936', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '15,936', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '15,944', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '15,950', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ]']\n", - "['2020-07-31 01', '42', '15,950', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '15,950', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '16,009', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 01', '42', '16,009', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'create_model(estimator=xgboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '16,024', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '16,024', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '16,025', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '16,026', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '16,026', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '16,026', 'INFO', 'Extreme Gradient Boosting Imported succesfully']\n", - "['2020-07-31 01', '42', '16,027', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '16,030', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '16,031', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,079', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,084', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,099', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '16,099', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,146', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,177', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '16,177', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,224', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,240', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,256', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '16,271', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,318', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,334', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,349', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '16,349', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,396', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,412', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,427', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '16,427', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,474', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,490', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,505', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '16,521', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,568', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,584', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,599', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '16,599', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,646', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,662', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,677', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '16,693', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,740', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,755', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,771', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '16,771', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,834', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,849', 'INFO', 'Compiling Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '16,865', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '16,865', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '16,880', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'create_model_container', '5']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'master_model_container', '5']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'display_container', '6']\n", - "['2020-07-31 01', '42', '16,943', 'INFO', \"XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 01', '42', '16,943', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '16,943', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'create_model_container', '5']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'master_model_container', '5']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'display_container', '7']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', \"XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '17,048', 'INFO', 'Initializing tune_model()']\n", - "['2020-07-31 01', '42', '17,049', 'INFO', 'tune_model(estimator=LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), fold=10, round=4, n_iter=10, custom_grid=None, optimize=Accuracy, choose_better=False, verbose=True)']\n", - "['2020-07-31 01', '42', '17,049', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '17,051', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '17,051', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '17,077', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '17,078', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '17,078', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '17,079', 'INFO', 'Base model', 'Logistic Regression']\n", - "['2020-07-31 01', '42', '17,080', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '17,080', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '17,088', 'INFO', 'Defining Hyperparameters']\n", - "['2020-07-31 01', '42', '17,088', 'INFO', 'Initializing RandomizedSearchCV']\n", - "['2020-07-31 01', '42', '20,205', 'INFO', 'Random search completed']\n", - "['2020-07-31 01', '42', '20,213', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '20,220', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,253', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,261', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,282', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '20,289', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,320', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,328', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,347', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '20,354', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,386', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,394', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,414', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '20,420', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,451', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,460', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,478', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '20,484', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,516', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,525', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,543', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '20,549', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,579', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,589', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,609', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '20,615', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,651', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,661', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,683', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '20,689', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,723', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,732', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,756', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '20,762', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,796', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,805', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,825', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '20,832', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,863', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,872', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,894', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '20,895', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '20,904', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '20,934', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '20,934', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '20,935', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '21,014', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '21,015', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '21,015', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '21,015', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'create_model_container', '6']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'master_model_container', '6']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'display_container', '8']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'tune_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '21,242', 'INFO', 'Initializing tune_model()']\n", - "['2020-07-31 01', '42', '21,243', 'INFO', 'tune_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), fold=10, round=4, n_iter=10, custom_grid=None, optimize=Accuracy, choose_better=False, verbose=True)']\n", - "['2020-07-31 01', '42', '21,243', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '21,244', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '21,244', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '21,264', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '21,265', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '21,265', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '21,266', 'INFO', 'Base model', 'Random Forest Classifier']\n", - "['2020-07-31 01', '42', '21,266', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '21,266', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '21,272', 'INFO', 'Defining Hyperparameters']\n", - "['2020-07-31 01', '42', '21,272', 'INFO', 'Initializing RandomizedSearchCV']\n", - "['2020-07-31 01', '42', '22,790', 'INFO', 'Random search completed']\n", - "['2020-07-31 01', '42', '22,816', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '22,831', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '22,955', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '23,185', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '23,211', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '23,217', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '23,340', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '23,563', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '23,582', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '23,586', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '23,716', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '23,951', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '23,968', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '23,974', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '24,091', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '24,320', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '24,351', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '24,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '24,483', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '24,718', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '24,742', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '24,747', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '24,866', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '25,117', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '25,141', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '25,146', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '25,283', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '25,518', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '25,542', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '25,547', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '25,666', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '25,919', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '25,938', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '25,938', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '26,084', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '26,312', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '26,334', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '26,338', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '26,457', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '26,677', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '26,699', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '26,700', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '26,707', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '26,829', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '26,830', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '26,830', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '26,911', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '26,911', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '26,912', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '26,912', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '26,927', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '26,931', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '26,931', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '26,931', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '27,309', 'INFO', 'create_model_container', '7']\n", - "['2020-07-31 01', '42', '27,309', 'INFO', 'master_model_container', '7']\n", - "['2020-07-31 01', '42', '27,309', 'INFO', 'display_container', '9']\n", - "['2020-07-31 01', '42', '27,310', 'INFO', 'RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '27,310', 'INFO', 'tune_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '27,315', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 01', '42', '27,316', 'INFO', \"ensemble_model(estimator=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Bagging, fold=10, n_estimators=10, round=4, choose_better=False, optimize=Accuracy, verbose=True)\"]\n", - "['2020-07-31 01', '42', '27,316', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '27,316', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '27,316', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '27,335', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '27,335', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '27,336', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '27,337', 'INFO', 'Base model', 'Decision Tree Classifier']\n", - "['2020-07-31 01', '42', '27,341', 'INFO', 'Importing untrained ensembler']\n", - "['2020-07-31 01', '42', '27,342', 'INFO', 'BaggingClassifier() succesfully imported']\n", - "['2020-07-31 01', '42', '27,347', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '27,347', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '27,349', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '27,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,384', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,416', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,430', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '27,435', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,459', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,487', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,504', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '27,509', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,534', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,567', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,582', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '27,587', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,612', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,644', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,658', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '27,663', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,686', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,718', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,733', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '27,738', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,764', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,799', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,816', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '27,822', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,852', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,892', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,904', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '27,904', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,938', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,970', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,985', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '27,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,015', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,047', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,062', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '28,067', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,121', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,139', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '28,140', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '28,150', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '28,173', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '28,173', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '28,174', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '28,239', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '28,239', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '28,240', 'INFO', 'save_model(model=BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '28,240', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '28,250', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '28,256', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)]']\n", - "['2020-07-31 01', '42', '28,256', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '28,256', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '28,419', 'INFO', 'create_model_container', '8']\n", - "['2020-07-31 01', '42', '28,420', 'INFO', 'master_model_container', '8']\n", - "['2020-07-31 01', '42', '28,420', 'INFO', 'display_container', '10']\n", - "['2020-07-31 01', '42', '28,421', 'INFO', 'BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)']\n", - "['2020-07-31 01', '42', '28,421', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '28,427', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 01', '42', '28,428', 'INFO', \"ensemble_model(estimator=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Boosting, fold=10, n_estimators=10, round=4, choose_better=False, optimize=Accuracy, verbose=True)\"]\n", - "['2020-07-31 01', '42', '28,428', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '28,428', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '28,429', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '28,447', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '28,447', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '28,449', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '28,452', 'INFO', 'Base model', 'Decision Tree Classifier']\n", - "['2020-07-31 01', '42', '28,456', 'INFO', 'Importing untrained ensembler']\n", - "['2020-07-31 01', '42', '28,457', 'INFO', 'AdaBoostClassifier() succesfully imported']\n", - "['2020-07-31 01', '42', '28,463', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '28,463', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '28,464', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '28,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,508', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,517', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,531', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '28,536', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,568', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,577', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,591', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '28,597', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,634', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,644', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,659', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '28,665', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,708', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,718', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,735', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '28,741', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,778', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,789', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,809', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '28,817', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,858', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,868', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,885', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '28,891', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,920', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,933', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,953', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '28,960', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,003', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '29,013', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '29,028', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '29,033', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,071', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '29,082', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '29,099', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '29,103', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,134', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '29,144', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '29,161', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '29,162', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '29,174', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '29,219', 'INFO', 'Uploading results into container']\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "IOPub message rate exceeded.\n", - "The notebook server will temporarily stop sending output\n", - "to the client in order to avoid crashing it.\n", - "To change this limit, set the config variable\n", - "`--NotebookApp.iopub_msg_rate_limit`.\n", - "\n", - "Current values:\n", - "NotebookApp.iopub_msg_rate_limit=1000.0 (msgs/sec)\n", - "NotebookApp.rate_limit_window=3.0 (secs)\n", - "\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "[\"warm_start=False), 'soft', True]]\"]\n", - "['2020-07-31 01', '42', '41,690', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '41,690', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '42,222', 'INFO', 'create_model_container', '11']\n", - "['2020-07-31 01', '42', '42,222', 'INFO', 'master_model_container', '11']\n", - "['2020-07-31 01', '42', '42,222', 'INFO', 'display_container', '13']\n", - "['2020-07-31 01', '42', '42,224', 'INFO', \"[AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "[\"warm_start=False), 'soft', True]\"]\n", - "['2020-07-31 01', '42', '42,224', 'INFO', 'stack_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '42,230', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '42,231', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=auc, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '42,231', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'plot type', 'auc']\n", - "['2020-07-31 01', '42', '42,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '42,413', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '42', '42,806', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '42,806', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '42,819', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '42,820', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=confusion_matrix, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '42,820', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '42,926', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '42,926', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '42,941', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '42,941', 'INFO', 'plot type', 'confusion_matrix']\n", - "['2020-07-31 01', '42', '42,957', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '42,957', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '42', '43,239', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '43,239', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '43,245', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '43,246', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=boundary, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '43,246', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'plot type', 'boundary']\n", - "['2020-07-31 01', '42', '43,491', 'INFO', 'Fitting StandardScaler()']\n", - "['2020-07-31 01', '42', '43,497', 'INFO', 'Fitting PCA()']\n", - "['2020-07-31 01', '42', '43,525', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '44,935', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '44,935', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '44,969', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '44,970', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=parameter, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '44,970', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'plot type', 'parameter']\n", - "['2020-07-31 01', '42', '45,092', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '45,092', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'create_model(estimator=catboost, ensemble=False, method=None, fold=10, round=4, cross_validation=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '45,120', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '45,121', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '45,122', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '45,122', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '45,127', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '45,128', 'INFO', 'CatBoost Classifier Imported succesfully']\n", - "['2020-07-31 01', '42', '45,128', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '45,133', 'INFO', 'Cross validation set to False']\n", - "['2020-07-31 01', '42', '45,134', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'create_model_container 11']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'master_model_container 11']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'display_container 13']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', '']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'create_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '46,719', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 01', '42', '46,719', 'INFO', 'interpret_model(estimator=, plot=summary, feature=None, observation=None)']\n", - "['2020-07-31 01', '42', '46,719', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'plot type', 'summary']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'model type detected', 'type 2']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 01', '42', '47,714', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 01', '42', '48,401', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '48,401', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'interpret_model(estimator=, plot=correlation, feature=None, observation=None)']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'plot type', 'correlation']\n", - "['2020-07-31 01', '42', '48,424', 'WARNING', 'No feature passed. Default value of feature used for correlation plot', 'WeekofPurchase']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'model type detected', 'type 2']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 01', '42', '48,742', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 01', '42', '49,226', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '49,226', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '49,245', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 01', '42', '49,245', 'INFO', 'interpret_model(estimator=, plot=reason, feature=None, observation=12)']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'plot type', 'reason']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'model type detected', 'type 2']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 01', '42', '49,564', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 01', '42', '49,970', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '49,970', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,001', 'INFO', 'Initializing automl()']\n", - "['2020-07-31 01', '42', '50,001', 'INFO', 'automl(optimize=Recall, use_holdout=False)']\n", - "['2020-07-31 01', '42', '50,001', 'INFO', 'Model Selection Basis', 'CV Results on Training set']\n", - "['2020-07-31 01', '42', '50,007', 'INFO', 'SubProcess finalize_model() called ==================================']\n", - "['2020-07-31 01', '42', '50,008', 'INFO', 'Initializing finalize_model()']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', \"finalize_model(estimator=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False))']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', 'Getting model name']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', 'Finalizing Logistic Regression']\n", - "['2020-07-31 01', '42', '50,038', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '50,073', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 01', '42', '50,073', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', \"create_model(estimator=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '50,082', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '50,082', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Declaring custom model']\n", - "['2020-07-31 01', '42', '50,084', 'INFO', 'Logistic Regression Imported succesfully']\n", - "['2020-07-31 01', '42', '50,085', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '50,087', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '50,088', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,114', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,121', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,126', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '50,128', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,152', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,158', 'INFO', 'Compiling Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '50,162', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '50,163', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,181', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,181', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,181', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '50,196', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,212', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,212', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,228', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '50,228', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,243', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,259', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,259', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '50,259', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,275', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,290', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,290', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '50,290', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,306', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,321', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,321', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '50,321', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,389', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,402', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,407', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '50,409', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,430', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'create_model_container', '12']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'master_model_container', '12']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'display_container', '14']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'create_model_container', '12']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'master_model_container', '12']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'display_container', '14']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'finalize_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'SubProcess finalize_model() end ==================================']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'automl() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '01,294', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '45', '01,295', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=best-model, verbose=True)']\n", - "['2020-07-31 01', '45', '01,295', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '45', '01,303', 'INFO', 'best-model.pkl saved in current working directory']\n", - "['2020-07-31 01', '45', '01,308', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '45', '01,309', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '03,776', 'INFO', 'Initializing deploy_model()']\n", - "['2020-07-31 01', '45', '03,776', 'INFO', \"deploy_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "[\"warm_start=False), model_name=best-aws, authentication={'bucket'\", \"'pycaret-test'}, platform=aws)\"]\n", - "['2020-07-31 01', '45', '03,798', 'INFO', 'Platform', 'AWS S3']\n", - "['2020-07-31 01', '45', '03,997', 'INFO', 'Saving model in active working directory']\n", - "['2020-07-31 01', '45', '03,997', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '45', '03,997', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '45', '03,998', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=best-aws, verbose=False)']\n", - "['2020-07-31 01', '45', '03,998', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '45', '04,004', 'INFO', 'best-aws.pkl saved in current working directory']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', 'Initializing S3 client']\n", - "['2020-07-31 01', '45', '04,989', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '45', '04,989', 'INFO', 'deploy_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'get_config(variable=X_train)']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'Global variable', 'X_train returned']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,044', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 01', '45', '05,044', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 01', '45', '05,045', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 01', '45', '05,045', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'Initializing set_config()']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'set_config(variable=seed, value=999)']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'Global variable', 'seed updated']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'set_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'get_config() succesfully completed......................................']\n" - ] - } - ], - "source": [ - "get_system_logs()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# 17. MLFlow UI" + "# 16. MLFlow UI" ] }, { diff --git a/examples/PyCaret 2 Clustering.ipynb b/examples/PyCaret 2 Clustering.ipynb index 44ad84eac9a1aa15aff8a1616f220764b3c2030c..11a332d675a03cf3efe9bca46615c98c67b76a90 100644 --- a/examples/PyCaret 2 Clustering.ipynb +++ b/examples/PyCaret 2 Clustering.ipynb @@ -14898,9339 +14898,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "# 10. Get System Logs" - ] - }, - { - "cell_type": "code", - "execution_count": 24, - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '40', '51,509', 'INFO', 'PyCaret Classification Module']\n", - "['2020-07-31 01', '40', '51,509', 'INFO', 'version 2.0']\n", - "['2020-07-31 01', '40', '51,509', 'INFO', 'Initializing setup()']\n", - "['2020-07-31 01', '40', '51,509', 'INFO', 'USI', '1cda']\n", - "['2020-07-31 01', '40', '51,510', 'INFO', 'setup(data=(1070, 19), target=Purchase, train_size=0.7, sampling=True, sample_estimator=None, categorical_features=None, categorical_imputation=constant, ordinal_features=None,']\n", - "['high_cardinality_features=None, high_cardinality_method=frequency, numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=None, normalize=False,']\n", - "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", - "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None, remove_outliers=False, outliers_threshold=0.05,']\n", - "['remove_multicollinearity=False, multicollinearity_threshold=0.9, remove_perfect_collinearity=False, create_clusters=False, cluster_iter=20,']\n", - "['polynomial_features=False, polynomial_degree=2, trigonometry_features=False, polynomial_threshold=0.1, group_features=None,']\n", - "['group_names=None, feature_selection=False, feature_selection_threshold=0.8, feature_interaction=False, feature_ratio=False, interaction_threshold=0.01,']\n", - "['fix_imbalance=False, fix_imbalance_method=None, data_split_shuffle=True, folds_shuffle=False, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", - "['experiment_name=juice1, log_plots=False, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", - "['2020-07-31 01', '40', '51,526', 'INFO', 'Checking environment']\n", - "['2020-07-31 01', '40', '51,526', 'INFO', 'python_version', '3.7.4']\n", - "['2020-07-31 01', '40', '51,527', 'INFO', 'python_build', \"('default', 'Aug 9 2019 18\", '34', \"13')\"]\n", - "['2020-07-31 01', '40', '51,527', 'INFO', 'machine', 'AMD64']\n", - "['2020-07-31 01', '40', '51,527', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Memory', 'svmem(total=17032478720, available=12121403392, percent=28.8, used=4911075328, free=12121403392)']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Physical Core', '4']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Logical Core', '8']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Checking libraries']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'pd==1.0.5']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'numpy==1.18.5']\n", - "['2020-07-31 01', '40', '55,335', 'INFO', 'sklearn==0.23.1']\n", - "['2020-07-31 01', '40', '55,728', 'INFO', 'xgboost==0.90']\n", - "['2020-07-31 01', '40', '56,084', 'INFO', 'lightgbm==2.3.1']\n", - "['2020-07-31 01', '40', '56,736', 'INFO', 'catboost==0.20.2']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'mlflow==1.8.0']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'Checking Exceptions']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '41', '00,697', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '41', '10,136', 'INFO', 'Copying data for preprocessing']\n", - "['2020-07-31 01', '41', '10,136', 'INFO', 'Declaring global variables']\n", - "['2020-07-31 01', '41', '10,162', 'INFO', 'Declaring preprocessing parameters']\n", - "['2020-07-31 01', '41', '10,162', 'INFO', 'Importing preprocessing module']\n", - "['2020-07-31 01', '41', '14,303', 'INFO', 'Creating preprocessing pipeline']\n", - "['2020-07-31 01', '41', '16,174', 'INFO', 'Preprocessing pipeline created successfully']\n", - "['2020-07-31 01', '41', '16,174', 'INFO', 'Creating grid variables']\n", - "['2020-07-31 01', '41', '16,174', 'INFO', 'Creating global containers']\n", - "['2020-07-31 01', '41', '16,270', 'INFO', 'Logging experiment in MLFlow']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False)]']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'create_model_container 0']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'master_model_container 0']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'display_container 0']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False)']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'setup() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '23,818', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 01', '41', '23,818', 'INFO', 'compare_models(blacklist=None, whitelist=None, fold=10, round=4, sort=Accuracy, n_select=1, turbo=True, verbose=True)']\n", - "['2020-07-31 01', '41', '23,818', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '41', '23,820', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '41', '23,820', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '41', '23,838', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '41', '23,839', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '41', '23,910', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 01', '41', '23,922', 'INFO', 'Import successful']\n", - "['2020-07-31 01', '41', '23,928', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '41', '23,928', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '41', '23,928', 'INFO', 'Initializing Logistic Regression']\n", - "['2020-07-31 01', '41', '23,934', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '23,940', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '23,996', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,003', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,007', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '24,013', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,057', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,064', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,068', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '24,073', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,111', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,118', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,122', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '24,127', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,168', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,174', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,178', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '24,182', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,224', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,230', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,235', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '24,240', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,279', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,286', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,290', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '24,296', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,338', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,345', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,349', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '24,354', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,391', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,398', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,402', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '24,407', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,447', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,453', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,457', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '24,462', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,503', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,514', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '24,514', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '24,523', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'save_model(model=LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '24,644', 'INFO', 'Initializing K Neighbors Classifier']\n", - "['2020-07-31 01', '41', '24,647', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '24,647', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,685', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,905', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,911', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '24,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,922', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,165', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,173', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '25,180', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,185', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,410', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,415', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '25,422', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,427', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,652', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,652', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '25,672', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,676', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,941', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,956', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '25,956', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,972', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,219', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '26,235', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '26,235', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '26,249', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,490', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '26,490', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '26,510', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '26,514', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,744', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '26,750', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '26,756', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '26,760', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,998', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,007', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '27,013', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,019', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,243', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,248', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '27,249', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '27,259', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '27,319', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '27,319', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '27,320', 'INFO', \"save_model(model=KNeighborsClassifier(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '41', '27,320', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '27,330', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '27,338', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), KNeighborsClassifier(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform')]\"]\n", - "['2020-07-31 01', '41', '27,338', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '27,338', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '27,380', 'INFO', 'Initializing Naive Bayes']\n", - "['2020-07-31 01', '41', '27,380', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '27,396', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,398', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,405', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,410', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '27,415', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,418', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,424', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,429', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '27,434', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,437', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,444', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,449', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '27,455', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,458', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,465', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,469', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '27,475', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,478', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,484', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,489', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '27,494', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,497', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,504', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,509', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '27,514', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,517', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,525', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,530', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '27,535', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,538', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,545', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,550', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '27,556', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,559', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,566', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,570', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '27,576', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,579', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,585', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,590', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '27,590', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '27,600', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'save_model(model=GaussianNB(priors=None, var_smoothing=1e-09), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), GaussianNB(priors=None, var_smoothing=1e-09)]']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '27,707', 'INFO', 'Initializing Decision Tree Classifier']\n", - "['2020-07-31 01', '41', '27,712', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '27,718', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,766', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,773', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,778', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '27,783', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,788', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,794', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,799', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '27,806', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,811', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,817', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,825', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '27,834', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,847', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,853', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '27,860', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,866', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,873', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,879', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '27,886', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,891', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,899', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,904', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '27,912', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,917', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,926', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,931', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '27,938', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,944', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,951', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,957', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '27,962', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,967', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,976', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,982', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '27,987', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,993', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,000', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,006', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '28,006', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '28,017', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '28,076', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '28,076', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '28,077', 'INFO', \"save_model(model=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '41', '28,077', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '28,082', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '28,086', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')]\"]\n", - "['2020-07-31 01', '41', '28,087', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '28,087', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '28,135', 'INFO', 'Initializing SVM - Linear Kernel']\n", - "['2020-07-31 01', '41', '28,141', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '28,147', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,188', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,188', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,191', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,193', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,198', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '28,204', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,212', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,212', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,215', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,217', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,222', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '28,227', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,235', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,235', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,238', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,240', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,245', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '28,250', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,256', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,256', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,259', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,262', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,266', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '28,272', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,276', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,276', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,279', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,281', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,286', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '28,291', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,297', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,297', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,300', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,302', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,307', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '28,312', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,319', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,319', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,322', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,324', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,329', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '28,334', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,341', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,341', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,344', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,346', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,350', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '28,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,364', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,364', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,367', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,369', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,374', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '28,378', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,386', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,386', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,389', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,391', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,396', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '28,396', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '28,407', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '28,473', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '28,474', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '28,474', 'INFO', 'save_model(model=SGDClassifier(alpha=0.0001, average=False, class_weight=None,']\n", - "['early_stopping=False, epsilon=0.1, eta0=0.0, fit_intercept=True,']\n", - "[\"l1_ratio=0.15, learning_rate='optimal', loss='hinge',\"]\n", - "[\"max_iter=1000, n_iter_no_change=5, n_jobs=-1, penalty='l2',\"]\n", - "['power_t=0.5, random_state=123, shuffle=True, tol=0.001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '28,474', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '28,479', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '28,483', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), SGDClassifier(alpha=0.0001, average=False, class_weight=None,']\n", - "['early_stopping=False, epsilon=0.1, eta0=0.0, fit_intercept=True,']\n", - "[\"l1_ratio=0.15, learning_rate='optimal', loss='hinge',\"]\n", - "[\"max_iter=1000, n_iter_no_change=5, n_jobs=-1, penalty='l2',\"]\n", - "['power_t=0.5, random_state=123, shuffle=True, tol=0.001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False)]']\n", - "['2020-07-31 01', '41', '28,483', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '28,483', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '28,532', 'INFO', 'Initializing Ridge Classifier']\n", - "['2020-07-31 01', '41', '28,532', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '28,547', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,630', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,630', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,646', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,646', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,646', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '28,646', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,662', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,662', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,665', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,667', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,676', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '28,683', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,687', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,687', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,690', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,692', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,697', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '28,706', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,711', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,711', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,713', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,715', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,720', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '28,726', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,730', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,730', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,733', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,735', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,739', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '28,744', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,748', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,749', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,751', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,754', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,759', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '28,764', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,768', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,768', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,771', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,773', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,778', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '28,784', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,788', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,788', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,791', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,793', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,799', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '28,804', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,809', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,809', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,813', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,816', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,821', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '28,827', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,831', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,831', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,834', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,836', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,841', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '28,841', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '28,853', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '28,934', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '28,935', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '28,935', 'INFO', 'save_model(model=RidgeClassifier(alpha=1.0, class_weight=None, copy_X=True, fit_intercept=True,']\n", - "[\"max_iter=None, normalize=False, random_state=123, solver='auto',\"]\n", - "['tol=0.001), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '28,935', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '28,940', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '28,944', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RidgeClassifier(alpha=1.0, class_weight=None, copy_X=True, fit_intercept=True,']\n", - "[\"max_iter=None, normalize=False, random_state=123, solver='auto',\"]\n", - "['tol=0.001)]']\n", - "['2020-07-31 01', '41', '28,944', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '28,944', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '28,994', 'INFO', 'Initializing Random Forest Classifier']\n", - "['2020-07-31 01', '41', '29,000', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '29,006', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '29,127', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '29,363', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '29,378', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '29,378', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '29,496', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '29,712', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '29,716', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '29,723', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '29,834', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '30,077', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '30,087', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '30,095', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '30,207', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '30,439', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '30,448', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '30,455', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '30,569', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '30,799', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '30,799', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '30,814', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '30,933', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '31,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '31,175', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '31,183', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '31,295', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '31,538', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '31,547', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '31,553', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '31,666', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '31,902', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '31,913', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '31,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,034', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,263', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,263', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '32,263', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,387', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,626', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,630', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '32,630', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '32,642', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '32,729', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '32,729', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '32,729', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '32,760', 'INFO', 'Initializing Quadratic Discriminant Analysis']\n", - "['2020-07-31 01', '41', '32,776', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '32,776', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,838', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,838', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,854', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '32,854', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,854', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,870', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,870', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '32,870', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,885', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,885', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,885', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '32,901', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,901', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,901', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,916', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '32,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,916', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,932', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,932', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '32,932', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,948', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,948', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,948', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '32,963', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,963', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,963', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,979', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '32,979', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,979', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,995', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,995', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '33,010', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,010', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,023', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,029', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '33,033', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,039', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,045', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,050', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '33,050', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '33,062', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'save_model(model=QuadraticDiscriminantAnalysis(priors=None, reg_param=0.0,']\n", - "['store_covariance=False, tol=0.0001), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), QuadraticDiscriminantAnalysis(priors=None, reg_param=0.0,']\n", - "['store_covariance=False, tol=0.0001)]']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '33,161', 'INFO', 'Initializing Ada Boost Classifier']\n", - "['2020-07-31 01', '41', '33,161', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '33,177', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,239', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,255', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,255', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '33,270', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,333', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,348', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,348', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '33,364', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,427', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,442', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,442', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '33,458', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,520', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,536', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,552', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '33,552', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,614', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,649', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,655', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '33,660', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,730', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,746', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,761', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '33,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,839', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,855', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,855', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '33,871', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,933', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,949', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,964', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '33,964', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,027', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,058', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,058', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '34,058', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,136', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,152', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,152', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '34,152', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '34,171', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '34,240', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '34,241', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '34,241', 'INFO', \"save_model(model=AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '34,241', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123)]']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '34,314', 'INFO', 'Initializing Gradient Boosting Classifier']\n", - "['2020-07-31 01', '41', '34,322', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '34,328', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,447', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,455', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,460', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '34,466', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,582', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,589', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,594', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '34,600', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,726', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,733', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,739', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '34,745', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,851', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,868', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,872', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '34,877', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,995', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,002', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,008', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '35,013', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,134', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,142', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,146', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '35,151', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,277', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,284', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,290', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '35,296', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,398', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,398', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,413', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '35,413', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,532', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,539', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,545', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '35,550', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,674', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,680', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,686', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '35,686', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '35,699', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', \"save_model(model=GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '35,814', 'INFO', 'Initializing Linear Discriminant Analysis']\n", - "['2020-07-31 01', '41', '35,832', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '35,838', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,848', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,855', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,860', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '35,865', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,873', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,880', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,885', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '35,890', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,900', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,906', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,911', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '35,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,924', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,931', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,936', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '35,941', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,949', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,956', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,960', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '35,966', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,973', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,980', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,985', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '35,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,999', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,005', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,013', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '36,021', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,031', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,037', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,043', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '36,048', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,055', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,062', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,066', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '36,071', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,079', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,086', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,091', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '36,091', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '36,103', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '36,160', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '36,160', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '36,161', 'INFO', 'save_model(model=LinearDiscriminantAnalysis(n_components=None, priors=None, shrinkage=None,']\n", - "[\"solver='svd', store_covariance=False, tol=0.0001), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '41', '36,161', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '36,165', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '36,168', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LinearDiscriminantAnalysis(n_components=None, priors=None, shrinkage=None,']\n", - "[\"solver='svd', store_covariance=False, tol=0.0001)]\"]\n", - "['2020-07-31 01', '41', '36,168', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '36,168', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '36,199', 'INFO', 'Initializing Extra Trees Classifier']\n", - "['2020-07-31 01', '41', '36,215', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '36,221', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,359', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,592', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,602', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '36,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,759', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,976', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,983', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '36,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '37,131', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '37,369', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '37,369', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '37,390', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '37,529', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '37,769', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '37,769', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '37,792', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '37,934', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '38,165', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '38,181', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '38,181', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '38,333', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '38,572', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '38,572', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '38,588', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '38,732', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '38,984', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '38,994', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '39,003', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '39,164', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '39,413', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '39,419', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '39,419', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '39,586', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '39,808', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '39,808', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '39,823', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '39,966', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,196', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,196', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '40,196', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '40,211', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'save_model(model=ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '40,333', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '40,349', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '40,349', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '40,349', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '40,395', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 01', '41', '40,395', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '40,410', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,501', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,517', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,532', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '40,537', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,568', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,584', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,603', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '40,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,655', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,667', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,678', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '40,687', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,727', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,740', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,751', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '40,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,800', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,813', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,820', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '40,834', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,873', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,886', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,897', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '40,906', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,946', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,959', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,970', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '40,980', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,020', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,032', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,043', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '41,054', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,096', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,109', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,119', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '41,128', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,175', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,188', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,199', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '41,199', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '41,228', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '41,348', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '41,349', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '41,349', 'INFO', \"save_model(model=XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '41,349', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '41,358', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '41,362', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)]']\n", - "['2020-07-31 01', '41', '41,362', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '41,362', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '41,423', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 01', '41', '41,429', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '41,434', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,515', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,533', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,544', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '41,554', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,628', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,645', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,656', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '41,665', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,734', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,737', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,753', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '41,769', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,837', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,838', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,853', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '41,873', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,936', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,937', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,953', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '41,972', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,047', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,063', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,074', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '42,084', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,180', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,196', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,208', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '42,218', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,287', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,302', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,318', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '42,318', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,380', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,412', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,412', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '42,427', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,502', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,519', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,530', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '42,531', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '42,561', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '42,651', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '42,651', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '42,652', 'INFO', \"save_model(model=LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '42,652', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '42,663', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '42,675', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)]']\n", - "['2020-07-31 01', '41', '42,675', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '42,675', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '42,777', 'INFO', 'Initializing CatBoost Classifier']\n", - "['2020-07-31 01', '41', '42,783', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '42,789', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '45,155', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '45,194', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '45,199', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '45,205', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '47,070', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '47,086', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '47,086', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '47,086', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '48,735', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '48,751', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '48,751', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '48,764', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '50,511', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '50,526', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '50,542', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '50,542', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '52,170', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '52,170', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '52,186', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '52,193', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '53,805', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '53,820', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '53,820', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '53,834', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '55,391', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '55,391', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '55,407', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '55,407', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '56,979', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '56,994', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '56,994', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '57,008', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '58,639', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '58,654', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '58,670', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '58,670', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,228', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,244', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,244', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '00,244', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '00,260', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '00,317', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '00,317', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '00,318', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '00,318', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '00,325', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '00,329', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ]']\n", - "['2020-07-31 01', '42', '00,329', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '00,329', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '00,375', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 01', '42', '00,375', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'create_model(estimator=lr, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '00,392', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '00,392', 'INFO', 'Logistic Regression Imported succesfully']\n", - "['2020-07-31 01', '42', '00,392', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '00,395', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '00,396', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,435', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,441', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,445', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '00,445', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,476', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,476', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,492', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '00,492', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,523', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,539', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,539', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '00,539', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,585', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,585', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,601', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '00,601', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,632', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,648', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,648', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '00,648', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,679', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,695', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,695', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '00,695', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,882', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,882', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,898', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '00,898', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '00,898', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'display_container', '1']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 01', '42', '00,999', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 01', '42', '00,999', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 01', '42', '01,000', 'INFO', 'display_container', '2']\n", - "['2020-07-31 01', '42', '01,000', 'INFO', 'LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '01,000', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'create_model(estimator=lr, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '01,010', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '01,033', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '01,034', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '01,035', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '01,035', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '01,039', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '01,039', 'INFO', 'Logistic Regression Imported succesfully']\n", - "['2020-07-31 01', '42', '01,040', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '01,046', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '01,050', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,094', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,101', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,113', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '01,118', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,160', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,166', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,180', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '01,185', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,230', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,236', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,248', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '01,253', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,295', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,301', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,314', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '01,322', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,368', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,374', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,378', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '01,378', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,432', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,438', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,444', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '01,444', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,497', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,503', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,511', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '01,511', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,561', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,568', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,582', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '01,587', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,626', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,633', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,646', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '01,651', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,694', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,700', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,715', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '01,716', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '01,724', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '01,766', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '01,930', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '01,931', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '01,931', 'INFO', 'save_model(model=LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '01,931', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '01,936', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '01,940', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '01,940', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '01,940', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '01,960', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '01,960', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '01,993', 'INFO', 'create_model_container', '2']\n", - "['2020-07-31 01', '42', '01,993', 'INFO', 'master_model_container', '2']\n", - "['2020-07-31 01', '42', '01,993', 'INFO', 'display_container', '3']\n", - "['2020-07-31 01', '42', '01,994', 'INFO', 'LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '01,994', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '02,000', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '02,000', 'INFO', 'create_model(estimator=dt, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '02,001', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '02,001', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '02,001', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '02,022', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '02,023', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '02,023', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '02,023', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '02,027', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '02,027', 'INFO', 'Decision Tree Classifier Imported succesfully']\n", - "['2020-07-31 01', '42', '02,028', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '02,035', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '02,040', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,046', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,054', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,069', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '02,073', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,078', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,085', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,099', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '02,104', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,108', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,115', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,133', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '02,137', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,143', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,149', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,165', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '02,170', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,174', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,181', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,198', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '02,204', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,208', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,216', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,234', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '02,239', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,244', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,252', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,268', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '02,273', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,279', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,290', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,307', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '02,313', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,318', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,326', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,342', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '02,347', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,352', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,360', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,376', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '02,377', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '02,385', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '02,390', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '02,521', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '02,521', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '02,521', 'INFO', \"save_model(model=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '42', '02,521', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '02,526', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '02,530', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')]\"]\n", - "['2020-07-31 01', '42', '02,530', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '02,530', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '02,545', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '02,545', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '02,583', 'INFO', 'create_model_container', '3']\n", - "['2020-07-31 01', '42', '02,583', 'INFO', 'master_model_container', '3']\n", - "['2020-07-31 01', '42', '02,583', 'INFO', 'display_container', '4']\n", - "['2020-07-31 01', '42', '02,584', 'INFO', \"DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')\"]\n", - "['2020-07-31 01', '42', '02,584', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '02,591', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '02,591', 'INFO', 'create_model(estimator=rf, ensemble=False, method=None, fold=5, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '02,591', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '02,592', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '02,592', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '02,613', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '02,614', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '02,615', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '02,615', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '02,619', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '02,620', 'INFO', 'Random Forest Classifier Imported succesfully']\n", - "['2020-07-31 01', '42', '02,620', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '02,626', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '02,631', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,758', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '03,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '03,028', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '03,034', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '03,159', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '03,378', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '03,408', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '03,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '03,526', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '03,754', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '03,773', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '03,778', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '03,894', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '04,129', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '04,146', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '04,146', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '04,276', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '04,495', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '04,517', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '04,518', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '04,524', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '04,642', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '05,065', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '05,065', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'create_model_container', '4']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'master_model_container', '4']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'display_container', '5']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '05,131', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 01', '42', '05,131', 'INFO', \"compare_models(blacklist=None, whitelist=['rf', 'ada', 'gbc', 'et', 'xgboost', 'lightgbm', 'catboost'], fold=3, round=4, sort=Accuracy, n_select=1, turbo=True, verbose=True)\"]\n", - "['2020-07-31 01', '42', '05,131', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '05,132', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '05,132', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '05,155', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '05,156', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '05,160', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 01', '42', '05,160', 'INFO', 'Import successful']\n", - "['2020-07-31 01', '42', '05,167', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '05,167', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '05,167', 'INFO', 'Initializing Random Forest Classifier']\n", - "['2020-07-31 01', '42', '05,172', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '05,179', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '05,293', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '05,535', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '05,535', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '05,550', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '05,676', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '05,894', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '05,894', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '05,910', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,026', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,258', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,258', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '06,258', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '06,273', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '06,339', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '06,339', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '06,340', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '06,340', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '06,400', 'INFO', 'Initializing Ada Boost Classifier']\n", - "['2020-07-31 01', '42', '06,405', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '06,411', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,478', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,496', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,496', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '06,496', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,575', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,581', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,596', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '06,596', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,670', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,680', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,680', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '06,680', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '06,696', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', \"save_model(model=AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123)]']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '06,825', 'INFO', 'Initializing Gradient Boosting Classifier']\n", - "['2020-07-31 01', '42', '06,825', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '06,841', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,929', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,929', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,944', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '06,944', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,030', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '07,046', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '07,046', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '07,046', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,146', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '07,146', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '07,162', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '07,162', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '07,162', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '07,241', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '07,241', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '07,242', 'INFO', \"save_model(model=GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '07,242', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '07,249', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '07,254', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '07,254', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '07,254', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '07,294', 'INFO', 'Initializing Extra Trees Classifier']\n", - "['2020-07-31 01', '42', '07,294', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '07,313', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,459', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '07,694', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '07,694', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '07,694', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,859', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,109', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,109', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '08,109', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,277', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,495', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,495', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '08,495', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '08,511', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'save_model(model=ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '08,705', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 01', '42', '08,721', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '08,727', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,759', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,773', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,781', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '08,794', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,828', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,842', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,853', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '08,864', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,900', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,913', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,924', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '08,925', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '08,947', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', \"save_model(model=XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)]']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '09,201', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 01', '42', '09,216', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '09,222', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '09,276', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '09,282', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '09,297', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '09,314', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '09,375', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '09,381', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '09,397', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '09,413', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '09,466', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '09,481', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '09,481', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '09,481', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '09,514', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', \"save_model(model=LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '09,613', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '09,628', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)]']\n", - "['2020-07-31 01', '42', '09,628', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '09,628', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '09,722', 'INFO', 'Initializing CatBoost Classifier']\n", - "['2020-07-31 01', '42', '09,733', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '09,738', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '11,485', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '11,485', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '11,501', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '11,508', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '13,655', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '13,671', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '13,671', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '13,686', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '15,832', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '15,844', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '15,851', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '15,851', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '15,867', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '15,935', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '15,936', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '15,936', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '15,936', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '15,944', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '15,950', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ]']\n", - "['2020-07-31 01', '42', '15,950', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '15,950', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '16,009', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 01', '42', '16,009', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'create_model(estimator=xgboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '16,024', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '16,024', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '16,025', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '16,026', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '16,026', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '16,026', 'INFO', 'Extreme Gradient Boosting Imported succesfully']\n", - "['2020-07-31 01', '42', '16,027', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '16,030', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '16,031', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,079', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,084', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,099', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '16,099', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,146', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,177', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '16,177', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,224', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,240', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,256', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '16,271', 'INFO', 'Fitting Model']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '16,318', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,334', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,349', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '16,349', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,396', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,412', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,427', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '16,427', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,474', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,490', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,505', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '16,521', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,568', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,584', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,599', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '16,599', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,646', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,662', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,677', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '16,693', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,740', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,755', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,771', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '16,771', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,834', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,849', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,865', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '16,865', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '16,880', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'create_model_container', '5']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'master_model_container', '5']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'display_container', '6']\n", - "['2020-07-31 01', '42', '16,943', 'INFO', \"XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 01', '42', '16,943', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '16,943', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'create_model_container', '5']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'master_model_container', '5']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'display_container', '7']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', \"XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '17,048', 'INFO', 'Initializing tune_model()']\n", - "['2020-07-31 01', '42', '17,049', 'INFO', 'tune_model(estimator=LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), fold=10, round=4, n_iter=10, custom_grid=None, optimize=Accuracy, choose_better=False, verbose=True)']\n", - "['2020-07-31 01', '42', '17,049', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '17,051', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '17,051', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '17,077', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '17,078', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '17,078', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '17,079', 'INFO', 'Base model', 'Logistic Regression']\n", - "['2020-07-31 01', '42', '17,080', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '17,080', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '17,088', 'INFO', 'Defining Hyperparameters']\n", - "['2020-07-31 01', '42', '17,088', 'INFO', 'Initializing RandomizedSearchCV']\n", - "['2020-07-31 01', '42', '20,205', 'INFO', 'Random search completed']\n", - "['2020-07-31 01', '42', '20,213', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '20,220', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,253', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,261', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,282', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '20,289', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,320', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,328', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,347', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '20,354', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,386', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,394', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,414', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '20,420', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,451', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,460', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,478', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '20,484', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,516', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,525', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,543', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '20,549', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,579', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,589', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,609', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '20,615', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,651', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,661', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,683', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '20,689', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,723', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,732', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,756', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '20,762', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,796', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,805', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,825', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '20,832', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,863', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,872', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,894', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '20,895', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '20,904', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '20,934', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '20,934', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '20,935', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '21,014', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '21,015', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '21,015', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '21,015', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'create_model_container', '6']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'master_model_container', '6']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'display_container', '8']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'tune_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '21,242', 'INFO', 'Initializing tune_model()']\n", - "['2020-07-31 01', '42', '21,243', 'INFO', 'tune_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), fold=10, round=4, n_iter=10, custom_grid=None, optimize=Accuracy, choose_better=False, verbose=True)']\n", - "['2020-07-31 01', '42', '21,243', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '21,244', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '21,244', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '21,264', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '21,265', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '21,265', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '21,266', 'INFO', 'Base model', 'Random Forest Classifier']\n", - "['2020-07-31 01', '42', '21,266', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '21,266', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '21,272', 'INFO', 'Defining Hyperparameters']\n", - "['2020-07-31 01', '42', '21,272', 'INFO', 'Initializing RandomizedSearchCV']\n", - "['2020-07-31 01', '42', '22,790', 'INFO', 'Random search completed']\n", - "['2020-07-31 01', '42', '22,816', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '22,831', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '22,955', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '23,185', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '23,211', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '23,217', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '23,340', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '23,563', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '23,582', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '23,586', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '23,716', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '23,951', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '23,968', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '23,974', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '24,091', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '24,320', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '24,351', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '24,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '24,483', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '24,718', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '24,742', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '24,747', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '24,866', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '25,117', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '25,141', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '25,146', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '25,283', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '25,518', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '25,542', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '25,547', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '25,666', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '25,919', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '25,938', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '25,938', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '26,084', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '26,312', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '26,334', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '26,338', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '26,457', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '26,677', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '26,699', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '26,700', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '26,707', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '26,829', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '26,830', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '26,830', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '26,911', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '26,911', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '26,912', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '26,912', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '26,927', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '26,931', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '26,931', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '26,931', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '27,309', 'INFO', 'create_model_container', '7']\n", - "['2020-07-31 01', '42', '27,309', 'INFO', 'master_model_container', '7']\n", - "['2020-07-31 01', '42', '27,309', 'INFO', 'display_container', '9']\n", - "['2020-07-31 01', '42', '27,310', 'INFO', 'RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '27,310', 'INFO', 'tune_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '27,315', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 01', '42', '27,316', 'INFO', \"ensemble_model(estimator=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Bagging, fold=10, n_estimators=10, round=4, choose_better=False, optimize=Accuracy, verbose=True)\"]\n", - "['2020-07-31 01', '42', '27,316', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '27,316', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '27,316', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '27,335', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '27,335', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '27,336', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '27,337', 'INFO', 'Base model', 'Decision Tree Classifier']\n", - "['2020-07-31 01', '42', '27,341', 'INFO', 'Importing untrained ensembler']\n", - "['2020-07-31 01', '42', '27,342', 'INFO', 'BaggingClassifier() succesfully imported']\n", - "['2020-07-31 01', '42', '27,347', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '27,347', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '27,349', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '27,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,384', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,416', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,430', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '27,435', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,459', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,487', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,504', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '27,509', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,534', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,567', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,582', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '27,587', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,612', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,644', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,658', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '27,663', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,686', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,718', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,733', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '27,738', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,764', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,799', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,816', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '27,822', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,852', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,892', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,904', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '27,904', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,938', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,970', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,985', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '27,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,015', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,047', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,062', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '28,067', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,121', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,139', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '28,140', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '28,150', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '28,173', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '28,173', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '28,174', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '28,239', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '28,239', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '28,240', 'INFO', 'save_model(model=BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '28,240', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '28,250', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '28,256', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)]']\n", - "['2020-07-31 01', '42', '28,256', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '28,256', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '28,419', 'INFO', 'create_model_container', '8']\n", - "['2020-07-31 01', '42', '28,420', 'INFO', 'master_model_container', '8']\n", - "['2020-07-31 01', '42', '28,420', 'INFO', 'display_container', '10']\n", - "['2020-07-31 01', '42', '28,421', 'INFO', 'BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)']\n", - "['2020-07-31 01', '42', '28,421', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '28,427', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 01', '42', '28,428', 'INFO', \"ensemble_model(estimator=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Boosting, fold=10, n_estimators=10, round=4, choose_better=False, optimize=Accuracy, verbose=True)\"]\n", - "['2020-07-31 01', '42', '28,428', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '28,428', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '28,429', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '28,447', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '28,447', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '28,449', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '28,452', 'INFO', 'Base model', 'Decision Tree Classifier']\n", - "['2020-07-31 01', '42', '28,456', 'INFO', 'Importing untrained ensembler']\n", - "['2020-07-31 01', '42', '28,457', 'INFO', 'AdaBoostClassifier() succesfully imported']\n", - "['2020-07-31 01', '42', '28,463', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '28,463', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '28,464', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '28,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,508', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,517', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,531', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '28,536', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,568', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,577', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,591', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '28,597', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,634', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,644', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,659', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '28,665', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,708', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,718', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,735', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '28,741', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,778', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,789', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,809', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '28,817', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,858', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,868', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,885', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '28,891', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,920', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,933', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,953', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '28,960', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,003', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '29,013', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '29,028', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '29,033', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,071', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '29,082', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '29,099', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '29,103', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,134', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '29,144', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '29,161', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '29,162', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '29,174', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '29,219', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '29,219', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '29,220', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '29,282', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '29,282', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '29,283', 'INFO', \"save_model(model=AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '29,283', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '29,297', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '29,304', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123)]']\n", - "['2020-07-31 01', '42', '29,304', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '29,304', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '29,449', 'INFO', 'create_model_container', '9']\n", - "['2020-07-31 01', '42', '29,449', 'INFO', 'master_model_container', '9']\n", - "['2020-07-31 01', '42', '29,449', 'INFO', 'display_container', '11']\n", - "['2020-07-31 01', '42', '29,450', 'INFO', \"AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123)']\n", - "['2020-07-31 01', '42', '29,450', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '29,456', 'INFO', 'Initializing blend_models()']\n", - "['2020-07-31 01', '42', '29,459', 'INFO', \"blend_models(estimator_list=[AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)], fold=10, round=4, choose_better=False, optimize=Accuracy, method=soft, turbo=True, verbose=True)']\n", - "['2020-07-31 01', '42', '29,459', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '29,461', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '29,461', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '29,481', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '29,481', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '29,482', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '29,482', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '29,486', 'INFO', 'Defining model names in estimator_list']\n", - "['2020-07-31 01', '42', '29,656', 'INFO', 'n_jobs multiple passed']\n", - "['2020-07-31 01', '42', '29,664', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '29,672', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,826', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '30,112', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '30,136', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '30,147', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '30,300', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '30,559', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '30,571', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '30,576', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '30,719', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '30,986', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '31,001', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '31,007', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '31,147', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '31,442', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '31,460', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '31,466', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '31,602', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '31,896', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '31,921', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '31,927', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '32,074', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '32,325', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '32,340', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '32,346', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '32,497', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '32,810', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '32,826', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '32,836', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '32,985', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '33,258', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '33,272', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '33,281', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '33,422', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '33,716', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '33,731', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '33,736', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '33,878', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '34,182', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '34,205', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '34,206', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '34,219', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '34,367', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '34,368', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '34,368', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '34,421', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '34,422', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '34,429', 'INFO', \"save_model(model=VotingClassifier(estimators=[('Bagging Classifier_1',\"]\n", - "['BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['r...']\n", - "['max_depth=30,']\n", - "[\"max_features='auto',\"]\n", - "['max_leaf_nodes=None,']\n", - "['max_samples=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False,']\n", - "['random_state=123,']\n", - "['verbose=0,']\n", - "['warm_start=False))],']\n", - "['flatten_transform=True, n_jobs=-1, verbose=False,']\n", - "[\"voting='soft', weights=None), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '42', '34,429', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '34,478', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '34,488', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), VotingClassifier(estimators=[('Bagging Classifier_1',\"]\n", - "['BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['r...']\n", - "['max_depth=30,']\n", - "[\"max_features='auto',\"]\n", - "['max_leaf_nodes=None,']\n", - "['max_samples=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False,']\n", - "['random_state=123,']\n", - "['verbose=0,']\n", - "['warm_start=False))],']\n", - "['flatten_transform=True, n_jobs=-1, verbose=False,']\n", - "[\"voting='soft', weights=None)]\"]\n", - "['2020-07-31 01', '42', '34,489', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '34,489', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '34,946', 'INFO', 'create_model_container', '10']\n", - "['2020-07-31 01', '42', '34,947', 'INFO', 'master_model_container', '10']\n", - "['2020-07-31 01', '42', '34,947', 'INFO', 'display_container', '12']\n", - "['2020-07-31 01', '42', '34,953', 'INFO', \"VotingClassifier(estimators=[('Bagging Classifier_1',\"]\n", - "['BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['r...']\n", - "['max_depth=30,']\n", - "[\"max_features='auto',\"]\n", - "['max_leaf_nodes=None,']\n", - "['max_samples=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False,']\n", - "['random_state=123,']\n", - "['verbose=0,']\n", - "['warm_start=False))],']\n", - "['flatten_transform=True, n_jobs=-1, verbose=False,']\n", - "[\"voting='soft', weights=None)\"]\n", - "['2020-07-31 01', '42', '34,954', 'INFO', 'blend_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '34,961', 'INFO', 'Initializing stack_models()']\n", - "['2020-07-31 01', '42', '34,963', 'INFO', \"stack_models(estimator_list=[AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)], meta_model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), fold=10, round=4, method=soft, restack=True, plot=False, choose_better=False, optimize=Accuracy, finalize=False, verbose=True)']\n", - "['2020-07-31 01', '42', '34,964', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '34,965', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '34,965', 'INFO', 'Copying estimator list']\n", - "['2020-07-31 01', '42', '34,970', 'INFO', 'Defining meta model']\n", - "['2020-07-31 01', '42', '34,972', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '34,990', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '34,991', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '34,993', 'INFO', 'Getting model names']\n", - "['2020-07-31 01', '42', '34,995', 'INFO', 'Checking base model', 'AdaBoostClassifier']\n", - "['2020-07-31 01', '42', '34,999', 'INFO', 'Fitting base model']\n", - "['2020-07-31 01', '42', '35,039', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 01', '42', '35,373', 'INFO', 'Checking base model', 'BaggingClassifier']\n", - "['2020-07-31 01', '42', '35,378', 'INFO', 'Fitting base model']\n", - "['2020-07-31 01', '42', '35,408', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 01', '42', '35,751', 'INFO', 'Checking base model', 'RandomForestClassifier']\n", - "['2020-07-31 01', '42', '35,751', 'INFO', 'Fitting base model']\n", - "['2020-07-31 01', '42', '35,872', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 01', '42', '37,647', 'INFO', 'Base layer complete']\n", - "['2020-07-31 01', '42', '37,802', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '37,804', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '37,809', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '37,921', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '38,152', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '38,166', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '38,172', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '38,289', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '38,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '38,540', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '38,554', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '38,673', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '38,892', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '38,922', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '38,929', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '39,040', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '39,259', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '39,274', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '39,286', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '39,406', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '39,641', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '39,660', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '39,660', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '39,792', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '40,042', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '40,064', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '40,070', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '40,189', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '40,439', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '40,454', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '40,461', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '40,574', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '40,793', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '40,808', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '40,816', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '40,938', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '41,188', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '41,209', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '41,215', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '41,339', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '41,557', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '41,572', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '41,572', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '41,583', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '41,583', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '41,583', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '41,658', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '41,658', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '41,658', 'INFO', \"save_model(model=[AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "[\"warm_start=False), 'soft', True], model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '42', '41,658', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '41,674', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '41,690', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), [AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "[\"warm_start=False), 'soft', True]]\"]\n", - "['2020-07-31 01', '42', '41,690', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '41,690', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '42,222', 'INFO', 'create_model_container', '11']\n", - "['2020-07-31 01', '42', '42,222', 'INFO', 'master_model_container', '11']\n", - "['2020-07-31 01', '42', '42,222', 'INFO', 'display_container', '13']\n", - "['2020-07-31 01', '42', '42,224', 'INFO', \"[AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "[\"warm_start=False), 'soft', True]\"]\n", - "['2020-07-31 01', '42', '42,224', 'INFO', 'stack_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '42,230', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '42,231', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=auc, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '42,231', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'plot type', 'auc']\n", - "['2020-07-31 01', '42', '42,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '42,413', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '42', '42,806', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '42,806', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '42,819', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '42,820', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=confusion_matrix, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '42,820', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '42,926', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '42,926', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '42,941', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '42,941', 'INFO', 'plot type', 'confusion_matrix']\n", - "['2020-07-31 01', '42', '42,957', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '42,957', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '42', '43,239', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '43,239', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '43,245', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '43,246', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=boundary, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '43,246', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'plot type', 'boundary']\n", - "['2020-07-31 01', '42', '43,491', 'INFO', 'Fitting StandardScaler()']\n", - "['2020-07-31 01', '42', '43,497', 'INFO', 'Fitting PCA()']\n", - "['2020-07-31 01', '42', '43,525', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '44,935', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '44,935', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '44,969', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '44,970', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=parameter, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '44,970', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'plot type', 'parameter']\n", - "['2020-07-31 01', '42', '45,092', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '45,092', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'create_model(estimator=catboost, ensemble=False, method=None, fold=10, round=4, cross_validation=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '45,120', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '45,121', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '45,122', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '45,122', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '45,127', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '45,128', 'INFO', 'CatBoost Classifier Imported succesfully']\n", - "['2020-07-31 01', '42', '45,128', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '45,133', 'INFO', 'Cross validation set to False']\n", - "['2020-07-31 01', '42', '45,134', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'create_model_container 11']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'master_model_container 11']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'display_container 13']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', '']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'create_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '46,719', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 01', '42', '46,719', 'INFO', 'interpret_model(estimator=, plot=summary, feature=None, observation=None)']\n", - "['2020-07-31 01', '42', '46,719', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'plot type', 'summary']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'model type detected', 'type 2']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 01', '42', '47,714', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 01', '42', '48,401', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '48,401', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'interpret_model(estimator=, plot=correlation, feature=None, observation=None)']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'plot type', 'correlation']\n", - "['2020-07-31 01', '42', '48,424', 'WARNING', 'No feature passed. Default value of feature used for correlation plot', 'WeekofPurchase']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'model type detected', 'type 2']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 01', '42', '48,742', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 01', '42', '49,226', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '49,226', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '49,245', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 01', '42', '49,245', 'INFO', 'interpret_model(estimator=, plot=reason, feature=None, observation=12)']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'plot type', 'reason']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'model type detected', 'type 2']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 01', '42', '49,564', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 01', '42', '49,970', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '49,970', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,001', 'INFO', 'Initializing automl()']\n", - "['2020-07-31 01', '42', '50,001', 'INFO', 'automl(optimize=Recall, use_holdout=False)']\n", - "['2020-07-31 01', '42', '50,001', 'INFO', 'Model Selection Basis', 'CV Results on Training set']\n", - "['2020-07-31 01', '42', '50,007', 'INFO', 'SubProcess finalize_model() called ==================================']\n", - "['2020-07-31 01', '42', '50,008', 'INFO', 'Initializing finalize_model()']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', \"finalize_model(estimator=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False))']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', 'Getting model name']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', 'Finalizing Logistic Regression']\n", - "['2020-07-31 01', '42', '50,038', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '50,073', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 01', '42', '50,073', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', \"create_model(estimator=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '50,082', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '50,082', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Declaring custom model']\n", - "['2020-07-31 01', '42', '50,084', 'INFO', 'Logistic Regression Imported succesfully']\n", - "['2020-07-31 01', '42', '50,085', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '50,087', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '50,088', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,114', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,121', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,126', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '50,128', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,152', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,158', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,162', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '50,163', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,181', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,181', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,181', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '50,196', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,212', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,212', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,228', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '50,228', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,243', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,259', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,259', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '50,259', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,275', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,290', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,290', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '50,290', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,306', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,321', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,321', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '50,321', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,389', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,402', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,407', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '50,409', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,430', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'create_model_container', '12']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'master_model_container', '12']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'display_container', '14']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'create_model_container', '12']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'master_model_container', '12']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'display_container', '14']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'finalize_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'SubProcess finalize_model() end ==================================']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'automl() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '01,294', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '45', '01,295', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=best-model, verbose=True)']\n", - "['2020-07-31 01', '45', '01,295', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '45', '01,303', 'INFO', 'best-model.pkl saved in current working directory']\n", - "['2020-07-31 01', '45', '01,308', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '45', '01,309', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '03,776', 'INFO', 'Initializing deploy_model()']\n", - "['2020-07-31 01', '45', '03,776', 'INFO', \"deploy_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "[\"warm_start=False), model_name=best-aws, authentication={'bucket'\", \"'pycaret-test'}, platform=aws)\"]\n", - "['2020-07-31 01', '45', '03,798', 'INFO', 'Platform', 'AWS S3']\n", - "['2020-07-31 01', '45', '03,997', 'INFO', 'Saving model in active working directory']\n", - "['2020-07-31 01', '45', '03,997', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '45', '03,997', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '45', '03,998', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=best-aws, verbose=False)']\n", - "['2020-07-31 01', '45', '03,998', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '45', '04,004', 'INFO', 'best-aws.pkl saved in current working directory']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', 'Initializing S3 client']\n", - "['2020-07-31 01', '45', '04,989', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '45', '04,989', 'INFO', 'deploy_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'get_config(variable=X_train)']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'Global variable', 'X_train returned']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,044', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 01', '45', '05,044', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 01', '45', '05,045', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 01', '45', '05,045', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'Initializing set_config()']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'set_config(variable=seed, value=999)']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'Global variable', 'seed updated']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'set_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '23,821', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '45', '23,822', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=FEATURE, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '45', '23,822', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '45', '27,575', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '45', '27,577', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=feature, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '45', '27,577', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '45', '27,691', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '45', '27,691', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '45', '27,691', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '45', '27,691', 'INFO', 'plot type', 'feature']\n", - "['2020-07-31 01', '45', '27,691', 'WARNING', 'No coef_ found. Trying feature_importances_']\n", - "['2020-07-31 01', '45', '27,906', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '45', '27,906', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '31,933', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '45', '31,934', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=pr, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '45', '31,934', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'plot type', 'pr']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '45', '32,057', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '45', '32,376', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '45', '32,376', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '42,906', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '45', '42,907', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=class_report, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '45', '42,907', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '45', '43,013', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '45', '43,013', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '45', '43,013', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '45', '43,013', 'INFO', 'plot type', 'class_report']\n", - "['2020-07-31 01', '45', '43,032', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '45', '43,033', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '45', '43,362', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '45', '43,362', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '16,732', 'INFO', 'PyCaret Regression Module']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'version 2.0']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'Initializing setup()']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'USI', '5b1c']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'setup(data=(1338, 7), target=charges, train_size=0.7, sampling=True, sample_estimator=None, categorical_features=None, categorical_imputation=constant, ordinal_features=None,']\n", - "['high_cardinality_features=None, high_cardinality_method=frequency, numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=None, normalize=False,']\n", - "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", - "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None, remove_outliers=False, outliers_threshold=0.05,']\n", - "['remove_multicollinearity=False, multicollinearity_threshold=0.9, remove_perfect_collinearity=False, create_clusters=False, cluster_iter=20,']\n", - "['polynomial_features=False, polynomial_degree=2, trigonometry_features=False, polynomial_threshold=0.1, group_features=None,']\n", - "['group_names=None, feature_selection=False, feature_selection_threshold=0.8, feature_interaction=False, feature_ratio=False, interaction_threshold=0.01, transform_target=False,']\n", - "['transform_target_method=box-cox, data_split_shuffle=True, folds_shuffle=False, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", - "['experiment_name=insurance1, log_plots=False, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'Checking environment']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'python_version', '3.7.4']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'python_build', \"('default', 'Aug 9 2019 18\", '34', \"13')\"]\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'machine', 'AMD64']\n", - "['2020-07-31 08', '44', '16,734', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'Memory', 'svmem(total=17032478720, available=12508303360, percent=26.6, used=4524175360, free=12508303360)']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'Physical Core', '4']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'Logical Core', '8']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'Checking libraries']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'pd==1.0.5']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'numpy==1.18.5']\n", - "['2020-07-31 08', '44', '17,421', 'INFO', 'sklearn==0.23.1']\n", - "['2020-07-31 08', '44', '17,518', 'INFO', 'xgboost==0.90']\n", - "['2020-07-31 08', '44', '17,654', 'INFO', 'lightgbm==2.3.1']\n", - "['2020-07-31 08', '44', '17,720', 'INFO', 'catboost==0.20.2']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'mlflow==1.8.0']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'Checking Exceptions']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '44', '21,667', 'INFO', 'Copying data for preprocessing']\n", - "['2020-07-31 08', '44', '21,667', 'INFO', 'Declaring global variables']\n", - "['2020-07-31 08', '44', '21,672', 'INFO', 'Declaring preprocessing parameters']\n", - "['2020-07-31 08', '44', '21,672', 'INFO', 'Importing preprocessing module']\n", - "['2020-07-31 08', '44', '22,570', 'INFO', 'Creating preprocessing pipeline']\n", - "['2020-07-31 08', '44', '23,523', 'INFO', 'Preprocessing pipeline created successfully']\n", - "['2020-07-31 08', '44', '23,523', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '23,523', 'INFO', 'Creating grid variables']\n", - "['2020-07-31 08', '44', '23,525', 'INFO', 'Creating global containers']\n", - "['2020-07-31 08', '44', '23,590', 'INFO', 'Logging experiment in MLFlow']\n", - "['2020-07-31 08', '44', '23,723', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '23,724', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '23,728', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", - "['2020-07-31 08', '44', '23,728', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '23,732', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '23,740', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), None]']\n", - "['2020-07-31 08', '44', '23,740', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '23,740', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '23,806', 'INFO', 'create_model_container', '0']\n", - "['2020-07-31 08', '44', '23,806', 'INFO', 'master_model_container', '0']\n", - "['2020-07-31 08', '44', '23,806', 'INFO', 'display_container', '0']\n", - "['2020-07-31 08', '44', '23,806', 'INFO', 'setup() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'compare_models(blacklist=None, whitelist=None, fold=5, round=4, sort=R2, n_select=1, turbo=True, verbose=True)']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '44', '25,754', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '44', '25,756', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '44', '25,767', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 08', '44', '25,768', 'INFO', 'Import successful']\n", - "['2020-07-31 08', '44', '25,774', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '44', '25,774', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '44', '25,774', 'INFO', 'Initializing Linear Regression']\n", - "['2020-07-31 08', '44', '25,782', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '25,788', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,795', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,796', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,797', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,856', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '25,873', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,876', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,877', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,877', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,883', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '25,888', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,892', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,894', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,894', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,900', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '25,905', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,907', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,909', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,909', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,915', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '25,920', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,923', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,925', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,925', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,931', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '25,932', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '25,940', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '25,990', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '25,990', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '25,991', 'INFO', 'save_model(model=LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '25,991', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '25,995', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '25,999', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), None]']\n", - "['2020-07-31 08', '44', '25,999', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '25,999', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,024', 'INFO', 'Initializing Lasso Regression']\n", - "['2020-07-31 08', '44', '26,039', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,051', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,056', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,057', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,058', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,063', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,071', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,074', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,076', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,076', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,082', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,088', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,093', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,093', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,099', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,105', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,108', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,109', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,110', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,115', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '26,121', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,125', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,126', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,126', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,132', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '26,132', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '26,140', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '26,196', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '26,197', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '26,197', 'INFO', 'save_model(model=Lasso(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=1000,']\n", - "['normalize=False, positive=False, precompute=False, random_state=123,']\n", - "[\"selection='cyclic', tol=0.0001, warm_start=False), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '26,197', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '26,201', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '26,205', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Lasso(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=1000,']\n", - "['normalize=False, positive=False, precompute=False, random_state=123,']\n", - "[\"selection='cyclic', tol=0.0001, warm_start=False), None]\"]\n", - "['2020-07-31 08', '44', '26,206', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '26,206', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,250', 'INFO', 'Initializing Ridge Regression']\n", - "['2020-07-31 08', '44', '26,255', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,260', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,265', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,266', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,266', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,272', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,278', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,281', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,283', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,283', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,289', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,294', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,297', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,298', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,298', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,304', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,309', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,312', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,314', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,314', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,320', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '26,325', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,329', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,330', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,330', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,336', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '26,336', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '26,346', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '26,403', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '26,403', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '26,403', 'INFO', 'save_model(model=Ridge(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=None,']\n", - "[\"normalize=False, random_state=123, solver='auto', tol=0.001), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '26,403', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '26,407', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '26,413', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Ridge(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=None,']\n", - "[\"normalize=False, random_state=123, solver='auto', tol=0.001), None]\"]\n", - "['2020-07-31 08', '44', '26,413', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '26,413', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,453', 'INFO', 'Initializing Elastic Net']\n", - "['2020-07-31 08', '44', '26,458', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,463', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,467', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,468', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,468', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,474', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,480', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,483', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,485', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,485', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,490', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,496', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,498', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,500', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,500', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,505', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,511', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,514', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,517', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,517', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,523', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '26,528', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,530', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,532', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,532', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,538', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '26,538', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '26,552', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '26,618', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '26,618', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '26,618', 'INFO', 'save_model(model=ElasticNet(alpha=1.0, copy_X=True, fit_intercept=True, l1_ratio=0.5,']\n", - "['max_iter=1000, normalize=False, positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic', tol=0.0001, warm_start=False), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '26,619', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '26,623', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '26,627', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ElasticNet(alpha=1.0, copy_X=True, fit_intercept=True, l1_ratio=0.5,']\n", - "['max_iter=1000, normalize=False, positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic', tol=0.0001, warm_start=False), None]\"]\n", - "['2020-07-31 08', '44', '26,627', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '26,628', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,667', 'INFO', 'Initializing Least Angle Regression']\n", - "['2020-07-31 08', '44', '26,672', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,678', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,684', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,686', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,686', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,692', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,698', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,703', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,705', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,705', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,710', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,716', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,721', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,723', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,723', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,728', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,735', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,742', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,744', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,744', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,751', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '26,756', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,762', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,764', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,764', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,771', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '26,772', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '26,787', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'save_model(model=Lars(copy_X=True, eps=2.220446049250313e-16, fit_intercept=True, fit_path=True,']\n", - "[\"jitter=None, n_nonzero_coefs=500, normalize=True, precompute='auto',\"]\n", - "['random_state=None, verbose=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '26,857', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Lars(copy_X=True, eps=2.220446049250313e-16, fit_intercept=True, fit_path=True,']\n", - "[\"jitter=None, n_nonzero_coefs=500, normalize=True, precompute='auto',\"]\n", - "['random_state=None, verbose=False), None]']\n", - "['2020-07-31 08', '44', '26,857', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '26,857', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,889', 'INFO', 'Initializing Lasso Least Angle Regression']\n", - "['2020-07-31 08', '44', '26,909', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,918', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,923', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,924', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,924', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,932', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,937', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,943', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,945', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,945', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,954', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,961', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,967', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,968', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,969', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,975', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,982', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,988', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,990', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,990', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,997', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '27,003', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,009', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,012', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,012', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,021', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '27,021', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '27,032', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '27,089', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '27,090', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '27,090', 'INFO', 'save_model(model=LassoLars(alpha=1.0, copy_X=True, eps=2.220446049250313e-16, fit_intercept=True,']\n", - "['fit_path=True, jitter=None, max_iter=500, normalize=True,']\n", - "[\"positive=False, precompute='auto', random_state=None, verbose=False), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '27,090', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '27,095', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '27,100', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LassoLars(alpha=1.0, copy_X=True, eps=2.220446049250313e-16, fit_intercept=True,']\n", - "['fit_path=True, jitter=None, max_iter=500, normalize=True,']\n", - "[\"positive=False, precompute='auto', random_state=None, verbose=False), None]\"]\n", - "['2020-07-31 08', '44', '27,100', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '27,100', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '27,144', 'INFO', 'Initializing Orthogonal Matching Pursuit']\n", - "['2020-07-31 08', '44', '27,148', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '27,155', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,158', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,160', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,160', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,166', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '27,173', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,177', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,178', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,179', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,186', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '27,194', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,197', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,199', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,199', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,206', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '27,213', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,216', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,218', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,218', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,224', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '27,232', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,236', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '44', '27,237', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,237', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,244', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '27,245', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '27,262', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '27,325', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '27,325', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '27,326', 'INFO', 'save_model(model=OrthogonalMatchingPursuit(fit_intercept=True, n_nonzero_coefs=None,']\n", - "[\"normalize=True, precompute='auto', tol=None), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '27,326', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '27,331', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '27,335', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), OrthogonalMatchingPursuit(fit_intercept=True, n_nonzero_coefs=None,']\n", - "[\"normalize=True, precompute='auto', tol=None), None]\"]\n", - "['2020-07-31 08', '44', '27,335', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '27,335', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '27,376', 'INFO', 'Initializing Bayesian Ridge']\n", - "['2020-07-31 08', '44', '27,381', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '27,387', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,393', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,395', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,396', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,403', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '27,410', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,415', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,417', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,417', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,423', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '27,429', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,434', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,435', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,436', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,441', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '27,447', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,455', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,457', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,457', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,463', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '27,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,474', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,476', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,476', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,482', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '27,482', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '27,493', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '27,550', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '27,551', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '27,551', 'INFO', 'save_model(model=BayesianRidge(alpha_1=1e-06, alpha_2=1e-06, alpha_init=None,']\n", - "['compute_score=False, copy_X=True, fit_intercept=True,']\n", - "['lambda_1=1e-06, lambda_2=1e-06, lambda_init=None, n_iter=300,']\n", - "['normalize=False, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '27,551', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '27,556', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '27,559', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), BayesianRidge(alpha_1=1e-06, alpha_2=1e-06, alpha_init=None,']\n", - "['compute_score=False, copy_X=True, fit_intercept=True,']\n", - "['lambda_1=1e-06, lambda_2=1e-06, lambda_init=None, n_iter=300,']\n", - "['normalize=False, tol=0.001, verbose=False), None]']\n", - "['2020-07-31 08', '44', '27,559', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '27,559', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '27,590', 'INFO', 'Initializing Passive Aggressive Regressor']\n", - "['2020-07-31 08', '44', '27,606', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '27,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,619', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,620', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,620', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,626', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '27,631', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,638', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,640', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,640', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,645', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '27,651', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,656', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,658', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,658', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,664', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '27,669', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,675', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,677', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,677', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,683', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '27,687', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,694', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,696', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,696', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,701', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '27,702', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '27,712', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '27,773', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '27,773', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '27,774', 'INFO', 'save_model(model=PassiveAggressiveRegressor(C=1.0, average=False, early_stopping=False,']\n", - "['epsilon=0.1, fit_intercept=True,']\n", - "[\"loss='epsilon_insensitive', max_iter=1000,\"]\n", - "['n_iter_no_change=5, random_state=123, shuffle=True,']\n", - "['tol=0.001, validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '27,774', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '27,775', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '27,783', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), PassiveAggressiveRegressor(C=1.0, average=False, early_stopping=False,']\n", - "['epsilon=0.1, fit_intercept=True,']\n", - "[\"loss='epsilon_insensitive', max_iter=1000,\"]\n", - "['n_iter_no_change=5, random_state=123, shuffle=True,']\n", - "['tol=0.001, validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), None]']\n", - "['2020-07-31 08', '44', '27,783', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '27,783', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '27,826', 'INFO', 'Initializing Random Sample Consensus']\n", - "['2020-07-31 08', '44', '27,831', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '27,836', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,923', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,924', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,924', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,930', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '27,935', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '28,015', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '28,017', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '28,017', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '28,022', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '28,027', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '28,105', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '28,106', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '28,106', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '28,112', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '28,116', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '28,195', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '28,197', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '28,197', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '28,202', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '28,208', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '28,298', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '28,300', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '28,300', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '28,306', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '28,306', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '28,322', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'save_model(model=RANSACRegressor(base_estimator=None, is_data_valid=None, is_model_valid=None,']\n", - "[\"loss='absolute_loss', max_skips=inf, max_trials=100,\"]\n", - "['min_samples=0.5, random_state=123, residual_threshold=None,']\n", - "['stop_n_inliers=inf, stop_probability=0.99, stop_score=inf), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '28,396', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RANSACRegressor(base_estimator=None, is_data_valid=None, is_model_valid=None,']\n", - "[\"loss='absolute_loss', max_skips=inf, max_trials=100,\"]\n", - "['min_samples=0.5, random_state=123, residual_threshold=None,']\n", - "['stop_n_inliers=inf, stop_probability=0.99, stop_score=inf), None]']\n", - "['2020-07-31 08', '44', '28,396', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '28,396', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '28,441', 'INFO', 'Initializing TheilSen Regressor']\n", - "['2020-07-31 08', '44', '28,446', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '28,450', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '30,326', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '30,328', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '30,328', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '30,334', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '30,339', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '30,808', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '30,808', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '30,808', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '30,824', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '30,830', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '31,292', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '31,292', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '31,292', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '31,307', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '31,313', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '31,820', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '31,822', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '31,822', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '31,827', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '31,827', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,321', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,321', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,321', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,336', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '32,336', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '32,353', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '32,409', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '32,409', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'save_model(model=TheilSenRegressor(copy_X=True, fit_intercept=True, max_iter=300,']\n", - "['max_subpopulation=10000, n_jobs=-1, n_subsamples=None,']\n", - "['random_state=123, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), TheilSenRegressor(copy_X=True, fit_intercept=True, max_iter=300,']\n", - "['max_subpopulation=10000, n_jobs=-1, n_subsamples=None,']\n", - "['random_state=123, tol=0.001, verbose=False), None]']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '32,457', 'INFO', 'Initializing Huber Regressor']\n", - "['2020-07-31 08', '44', '32,457', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '32,468', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,520', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,522', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,522', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,527', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '32,527', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,579', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,580', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,580', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,586', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '32,591', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,636', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,638', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,638', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,643', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '32,650', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,690', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,692', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,692', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,697', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '32,702', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,749', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,750', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,750', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,756', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '32,756', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '32,761', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '32,821', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '32,822', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '32,822', 'INFO', 'save_model(model=HuberRegressor(alpha=0.0001, epsilon=1.35, fit_intercept=True, max_iter=100,']\n", - "['tol=1e-05, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '32,822', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '32,827', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '32,831', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), HuberRegressor(alpha=0.0001, epsilon=1.35, fit_intercept=True, max_iter=100,']\n", - "['tol=1e-05, warm_start=False), None]']\n", - "['2020-07-31 08', '44', '32,831', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '32,831', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '32,860', 'INFO', 'Initializing Support Vector Machine']\n", - "['2020-07-31 08', '44', '32,860', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '32,880', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,938', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,942', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,943', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,948', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '32,953', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,976', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,981', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,981', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,986', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '32,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,013', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,018', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,018', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,024', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '33,029', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,053', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,058', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,058', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,062', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '33,067', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,096', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,096', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,101', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '33,102', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '33,113', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '33,175', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '33,176', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '33,176', 'INFO', \"save_model(model=SVR(C=1.0, cache_size=200, coef0=0.0, degree=3, epsilon=0.1, gamma='scale',\"]\n", - "[\"kernel='rbf', max_iter=-1, shrinking=True, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '33,176', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '33,177', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '33,177', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), SVR(C=1.0, cache_size=200, coef0=0.0, degree=3, epsilon=0.1, gamma='scale',\"]\n", - "[\"kernel='rbf', max_iter=-1, shrinking=True, tol=0.001, verbose=False), None]\"]\n", - "['2020-07-31 08', '44', '33,177', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '33,177', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '33,211', 'INFO', 'Initializing K Neighbors Regressor']\n", - "['2020-07-31 08', '44', '33,227', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '33,227', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,227', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,358', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,358', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,373', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '33,383', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,388', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,507', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,507', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,507', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '33,519', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,523', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,641', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,641', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,657', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '33,669', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,674', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,780', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,780', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,788', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '33,794', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,798', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,908', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,908', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,908', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '33,908', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '33,945', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '34,004', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '34,005', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '34,005', 'INFO', \"save_model(model=KNeighborsRegressor(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '34,005', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '34,010', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '34,011', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), KNeighborsRegressor(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform'), None]\"]\n", - "['2020-07-31 08', '44', '34,011', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '34,011', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '34,042', 'INFO', 'Initializing Decision Tree']\n", - "['2020-07-31 08', '44', '34,060', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '34,065', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,070', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,072', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,072', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,078', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '34,084', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,089', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,090', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,090', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,096', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '34,101', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,105', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,107', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,107', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,113', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '34,118', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,122', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,124', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,124', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,130', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '34,135', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,140', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,141', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,141', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,147', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '34,147', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '34,159', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '34,216', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '34,217', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '34,217', 'INFO', \"save_model(model=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '34,217', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '34,222', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '34,226', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), None]\"]\n", - "['2020-07-31 08', '44', '34,226', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '34,226', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '34,259', 'INFO', 'Initializing Random Forest']\n", - "['2020-07-31 08', '44', '34,259', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '34,276', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,425', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,550', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,550', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,550', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '34,561', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,708', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,813', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,814', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,828', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '34,844', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '35,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '35,197', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '35,197', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '35,203', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '35,208', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '35,456', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '35,575', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '35,575', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '35,582', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '35,590', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '35,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '35,966', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '35,966', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '35,966', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '35,966', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '35,981', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '36,045', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '36,045', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '36,045', 'INFO', \"save_model(model=RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '36,045', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '36,076', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '36,076', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '44', '36,076', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '36,076', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '36,123', 'INFO', 'Initializing Extra Trees Regressor']\n", - "['2020-07-31 08', '44', '36,123', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '36,141', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '36,290', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '36,396', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '36,396', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '36,412', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '36,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '36,574', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '36,684', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '36,684', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '36,684', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '36,699', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '36,842', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '36,962', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '36,962', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '36,977', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '36,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,141', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,267', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,267', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,282', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '37,299', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,441', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,558', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,558', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,558', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '37,558', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '37,573', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '37,661', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '37,661', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '37,661', 'INFO', \"save_model(model=ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '37,661', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '37,693', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '37,693', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '44', '37,693', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '37,693', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '37,739', 'INFO', 'Initializing AdaBoost Regressor']\n", - "['2020-07-31 08', '44', '37,739', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '37,758', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,782', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,785', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,785', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,790', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '37,797', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,817', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,820', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,820', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,827', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '37,833', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,851', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,854', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,854', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,861', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '37,866', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,882', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,884', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,884', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,891', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '37,897', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,916', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,918', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,918', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,925', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '37,925', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '37,939', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '37,998', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '37,998', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '37,999', 'INFO', \"save_model(model=AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '37,999', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '38,008', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '38,013', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", - "['n_estimators=50, random_state=123), None]']\n", - "['2020-07-31 08', '44', '38,013', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '38,013', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '38,045', 'INFO', 'Initializing Gradient Boosting Regressor']\n", - "['2020-07-31 08', '44', '38,045', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '38,066', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,130', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,145', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,145', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,145', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '38,159', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,230', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,230', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,230', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,230', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '38,245', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,318', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,320', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,320', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,326', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '38,332', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,396', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,396', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,396', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,396', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '38,415', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,484', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,486', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,486', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,492', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '38,492', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '38,508', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', \"save_model(model=GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '38,578', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '44', '38,578', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '38,578', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '38,625', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 08', '44', '38,625', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '38,642', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,685', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,686', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,687', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,697', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '38,711', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,753', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,755', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,755', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,773', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '38,783', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,827', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,829', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,829', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,846', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '38,855', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,899', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,901', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,901', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,914', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '38,926', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,968', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,970', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,970', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,982', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '38,983', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '39,014', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', \"save_model(model=XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '39,112', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), None]']\n", - "['2020-07-31 08', '44', '39,112', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '39,112', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '39,143', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 08', '44', '39,159', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '39,165', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,231', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,246', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,246', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,246', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '39,269', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,361', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,365', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,365', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,378', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '39,388', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,482', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,486', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,486', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,499', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '39,510', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,581', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,581', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,581', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,596', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '39,608', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,693', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,697', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,697', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,710', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '39,710', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '39,742', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '39,836', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '39,836', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '39,837', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '39,837', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '39,848', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '39,848', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '44', '39,848', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '39,848', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '39,956', 'INFO', 'Initializing CatBoost Regressor']\n", - "['2020-07-31 08', '44', '39,961', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '39,969', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '41,306', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '41,306', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '41,306', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '41,322', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '41,330', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '42,400', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '42,402', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '42,403', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '42,410', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '42,416', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '43,476', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '43,492', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '43,492', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '43,492', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '43,504', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '44,609', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '44,609', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '44,609', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '44,609', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '44,627', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '45,723', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '45,774', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '45,775', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '45,775', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '45,775', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '45,813', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '45,834', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), , None]']\n", - "['2020-07-31 08', '44', '45,834', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '45,834', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '45,916', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 08', '44', '45,916', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'create_model(estimator=xgboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '44', '45,935', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '44', '45,935', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '44', '45,936', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '44', '45,936', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '44', '45,937', 'INFO', 'Extreme Gradient Boosting Regressor Imported succesfully']\n", - "['2020-07-31 08', '44', '45,937', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '44', '45,938', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '45,939', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '45,977', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '45,979', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '45,979', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '45,990', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '45,992', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,031', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,033', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,033', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,044', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '46,048', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,067', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,083', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,083', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,083', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '46,083', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,129', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,129', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,129', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,129', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '46,145', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,176', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,176', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,176', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,192', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '44', '46,192', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,223', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,223', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,223', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,239', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '44', '46,239', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,270', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,270', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,270', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,286', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '44', '46,286', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,335', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,337', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,337', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,349', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '44', '46,350', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,397', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,397', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,397', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,412', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '44', '46,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,459', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,459', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,459', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,475', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '46,475', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '46,490', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'display_container', '1']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', \"XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', 'display_container', '2']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', \"XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '06,693', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '06,693', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '06,694', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '06,694', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '06,694', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '06,717', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '06,717', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '06,718', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '06,718', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '06,722', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '06,723', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '06,728', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '06,733', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '06,819', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '06,823', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '06,823', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '06,852', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '06,860', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '06,951', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '06,955', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '06,955', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '06,984', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '06,992', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,090', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,094', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,094', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,123', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '07,132', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,207', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,207', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,207', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,246', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '07,255', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,339', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,343', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,343', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,374', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '07,383', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,466', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,469', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,469', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,499', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '07,507', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,591', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,595', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,595', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,626', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '07,635', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,717', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,721', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,721', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,753', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '07,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,842', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,842', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,842', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,877', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '07,885', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,972', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,975', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,976', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '08,009', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '08,011', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '08,024', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '08,113', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '08,329', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '08,329', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '08,330', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '08,330', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '08,349', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '08,360', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '08,360', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '08,361', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '08,401', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '08,401', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', 'create_model_container', '2']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', 'master_model_container', '2']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', 'display_container', '3']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '09,734', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '09,734', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '09,734', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '09,734', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '09,735', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '09,754', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '09,755', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '09,756', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '09,756', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '09,761', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '09,761', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '09,766', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '09,771', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '09,853', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '09,857', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '09,857', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '09,886', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '09,894', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '09,980', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '09,984', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '09,984', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,013', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '10,023', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,104', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,108', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,108', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,137', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '10,145', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,250', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,253', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,254', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,285', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '10,294', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,393', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,396', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,397', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,426', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '10,435', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,516', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,520', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,520', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,542', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '10,565', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,650', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,654', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,654', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,685', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '10,693', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,777', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,780', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,781', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,812', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '10,821', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,905', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,910', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,910', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,948', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '10,957', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '11,041', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '11,045', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '11,045', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '11,075', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '11,077', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '11,094', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '11,191', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '11,397', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '11,397', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '11,398', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '11,399', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '11,417', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '11,427', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '11,428', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '11,428', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '11,465', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '11,465', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '11,521', 'INFO', 'create_model_container', '3']\n", - "['2020-07-31 08', '45', '11,522', 'INFO', 'master_model_container', '3']\n", - "['2020-07-31 08', '45', '11,522', 'INFO', 'display_container', '4']\n", - "['2020-07-31 08', '45', '11,522', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '11,522', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '11,540', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '11,541', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '11,542', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '11,542', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '11,546', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '11,547', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '11,551', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '11,557', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '11,638', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '11,642', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '11,642', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '11,670', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '11,679', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '11,784', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '11,788', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '11,788', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '11,812', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '11,820', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,003', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,007', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,007', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,037', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '12,046', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,125', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,126', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,126', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,159', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '12,168', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,250', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,254', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,254', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,285', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '12,294', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,383', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,387', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,387', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,417', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '12,426', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,492', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,508', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,508', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,542', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '12,550', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,660', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,663', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,664', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,698', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '12,708', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,794', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,798', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,798', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,830', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '12,838', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,921', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,925', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,925', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,959', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '12,961', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '12,975', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '13,077', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '13,302', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '13,303', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '13,304', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.2, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '13,304', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '13,323', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '13,335', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.2, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '13,335', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '13,335', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '13,373', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '13,373', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '13,434', 'INFO', 'create_model_container', '4']\n", - "['2020-07-31 08', '45', '13,434', 'INFO', 'master_model_container', '4']\n", - "['2020-07-31 08', '45', '13,434', 'INFO', 'display_container', '5']\n", - "['2020-07-31 08', '45', '13,434', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.2, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '13,452', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '13,452', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '13,453', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '13,453', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '13,458', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '13,458', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '13,463', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '13,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '13,542', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '13,542', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '13,542', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '13,579', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '13,588', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '13,659', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '13,659', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '13,659', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '13,700', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '13,708', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '13,776', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '13,776', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '13,776', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '13,820', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '13,828', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '13,910', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '13,910', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '13,910', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '13,943', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '13,951', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,043', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,043', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,043', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,081', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '14,090', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,196', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,200', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,200', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,230', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '14,240', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,334', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,337', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,338', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,370', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '14,379', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,463', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,467', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,467', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,498', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '14,507', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,588', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,592', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,592', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,625', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '14,634', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,732', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,736', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,736', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,767', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '14,769', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '14,783', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '14,871', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '15,089', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '15,090', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '15,091', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.30000000000000004,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '15,091', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '15,110', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '15,122', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.30000000000000004,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '15,122', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '15,122', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '15,159', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '15,159', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', 'create_model_container', '5']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', 'master_model_container', '5']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', 'display_container', '6']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.30000000000000004,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0)']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '15,236', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '15,237', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '15,238', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '15,238', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '15,242', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '15,243', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '15,247', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '15,252', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,327', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,327', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,327', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,364', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '15,373', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,457', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,461', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,461', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,489', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '15,497', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,578', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,578', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,578', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,610', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '15,619', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,726', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,730', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,730', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,759', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '15,769', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,861', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,865', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,865', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,897', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '15,906', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,004', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,008', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,039', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '16,049', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,142', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,146', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,147', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,180', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '16,189', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,280', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,284', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,284', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,315', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '16,325', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,410', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,414', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,414', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,449', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '16,458', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,553', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,557', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,557', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,592', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '16,594', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '16,608', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '16,701', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '16,919', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '16,920', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '16,921', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.4, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '16,922', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '16,944', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '16,956', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.4, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '16,956', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '16,956', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '16,995', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '16,995', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '17,052', 'INFO', 'create_model_container', '6']\n", - "['2020-07-31 08', '45', '17,052', 'INFO', 'master_model_container', '6']\n", - "['2020-07-31 08', '45', '17,053', 'INFO', 'display_container', '7']\n", - "['2020-07-31 08', '45', '17,053', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.4, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '17,053', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '17,072', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '17,072', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '17,073', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '17,074', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '17,078', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '17,079', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '17,083', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '17,087', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,160', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,160', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,160', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,198', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '17,207', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,292', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,296', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,296', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,323', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '17,333', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,428', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,432', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,432', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,465', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '17,474', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,575', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,578', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,579', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,610', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '17,618', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,703', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,707', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,707', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,738', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '17,744', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,830', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,834', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,834', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,865', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '17,873', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,945', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,961', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,961', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,992', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '18,001', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '18,090', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '18,094', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '18,094', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '18,128', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '18,140', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '18,227', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '18,232', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '18,232', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '18,268', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '18,276', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '18,360', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '18,364', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '18,365', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '18,399', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '18,401', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '18,414', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '18,521', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '18,779', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '18,779', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '18,779', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.5, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '18,779', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '18,795', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '18,811', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.5, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '18,811', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '18,811', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '18,857', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '18,857', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', 'create_model_container', '7']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', 'master_model_container', '7']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', 'display_container', '8']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.5, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '18,934', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '18,935', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '18,935', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '18,936', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '18,940', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '18,941', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '18,946', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '18,951', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,042', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,046', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,047', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,076', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '19,087', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,162', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,162', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,205', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '19,214', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,296', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,296', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,296', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,330', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '19,339', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,424', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,428', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,428', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,458', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '19,467', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,578', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,578', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,578', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,618', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '19,628', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,716', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,720', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,720', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,752', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '19,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,843', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,847', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,848', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,881', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '19,890', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,986', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,990', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,990', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '20,023', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '20,032', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '20,122', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '20,126', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '20,126', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '20,163', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '20,172', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '20,246', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '20,246', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '20,246', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '20,292', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '20,294', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '20,309', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '20,394', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '20,611', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '20,612', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '20,613', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.6, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '20,613', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '20,630', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '20,645', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.6, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '20,645', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '20,645', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '20,692', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '20,692', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '20,742', 'INFO', 'create_model_container', '8']\n", - "['2020-07-31 08', '45', '20,742', 'INFO', 'master_model_container', '8']\n", - "['2020-07-31 08', '45', '20,742', 'INFO', 'display_container', '9']\n", - "['2020-07-31 08', '45', '20,743', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.6, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '20,743', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '20,760', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '20,760', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '20,761', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '20,761', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '20,765', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '20,766', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '20,770', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '20,777', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '20,846', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '20,846', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '20,846', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '20,888', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '20,897', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '20,996', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '20,996', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '20,996', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,041', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '21,051', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,146', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,162', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,200', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '21,215', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,297', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,313', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,313', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,346', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '21,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,450', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,454', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,454', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,485', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '21,497', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,597', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,601', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,601', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,634', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '21,643', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,742', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,747', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,747', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,782', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '21,795', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,879', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,879', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,879', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,924', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '21,934', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '22,027', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '22,043', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '22,043', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '22,084', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '22,093', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '22,195', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '22,195', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '22,195', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '22,245', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '22,248', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '22,266', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '22,362', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '22,584', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '22,584', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '22,586', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.7000000000000001,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '22,586', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '22,609', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '22,614', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.7000000000000001,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '22,614', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '22,614', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '22,692', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '22,692', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '22,739', 'INFO', 'create_model_container', '9']\n", - "['2020-07-31 08', '45', '22,739', 'INFO', 'master_model_container', '9']\n", - "['2020-07-31 08', '45', '22,739', 'INFO', 'display_container', '10']\n", - "['2020-07-31 08', '45', '22,743', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.7000000000000001,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0)']\n", - "['2020-07-31 08', '45', '22,743', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '22,744', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '22,748', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '22,748', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '22,748', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '22,748', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '22,799', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '22,802', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '22,803', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '22,803', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '22,812', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '22,812', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '22,827', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '22,844', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '22,930', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '22,930', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '22,930', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '22,969', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '22,979', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,064', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,064', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,064', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,098', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '23,113', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,197', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,197', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,197', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,235', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '23,244', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,330', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,331', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,331', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,365', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '23,375', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,498', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,502', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,503', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,544', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '23,554', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,660', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,664', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,664', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,699', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '23,710', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,811', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,816', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,816', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,851', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '23,861', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,947', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,947', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,947', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,987', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '23,996', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '24,081', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '24,081', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '24,081', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '24,122', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '24,132', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '24,229', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '24,229', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '24,229', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '24,271', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '24,273', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '24,288', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '24,380', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '24,596', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '24,597', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '24,598', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.8, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '24,598', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '24,614', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '24,614', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.8, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '24,629', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '24,629', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '24,660', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '24,660', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', 'create_model_container', '10']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', 'master_model_container', '10']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', 'display_container', '11']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.8, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '24,744', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '24,744', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '24,745', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '24,745', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '24,750', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '24,750', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '24,755', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '24,760', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '24,841', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '24,845', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '24,845', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '24,875', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '24,884', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '24,965', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '24,965', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '24,965', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,005', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '25,015', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,130', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,130', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,130', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,165', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '25,165', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,280', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,280', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,280', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,318', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '25,327', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,423', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,427', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,427', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,460', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '25,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,572', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,577', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,577', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,612', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '25,621', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,698', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,698', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,698', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,747', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '25,755', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,832', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,832', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,832', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,878', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '25,887', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,981', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,986', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,986', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '26,023', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '26,034', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '26,137', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '26,142', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '26,142', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '26,180', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '26,182', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '26,197', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '26,299', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '26,531', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '26,532', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '26,533', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.9, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '26,533', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '26,548', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '26,564', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.9, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '26,564', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '26,564', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '26,626', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '26,626', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '26,673', 'INFO', 'create_model_container', '11']\n", - "['2020-07-31 08', '45', '26,673', 'INFO', 'master_model_container', '11']\n", - "['2020-07-31 08', '45', '26,673', 'INFO', 'display_container', '12']\n", - "['2020-07-31 08', '45', '26,675', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.9, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '26,675', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '35,225', 'INFO', 'Initializing tune_model()']\n", - "['2020-07-31 08', '45', '35,225', 'INFO', \"tune_model(estimator=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), fold=10, round=4, n_iter=50, custom_grid=None, optimize=MAE, choose_better=False, verbose=True)']\n", - "['2020-07-31 08', '45', '35,226', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '35,226', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '35,226', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '35,246', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '35,246', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '35,247', 'INFO', 'Checking base model']\n", - "['2020-07-31 08', '45', '35,248', 'INFO', 'Base model', 'Light Gradient Boosting Machine']\n", - "['2020-07-31 08', '45', '35,249', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '35,249', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '35,255', 'INFO', 'Defining Hyperparameters']\n", - "['2020-07-31 08', '45', '35,255', 'INFO', 'Initializing RandomizedSearchCV']\n", - "['2020-07-31 08', '45', '37,358', 'INFO', 'Random search completed']\n", - "['2020-07-31 08', '45', '37,367', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '37,377', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,389', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,392', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,423', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '37,431', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,444', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,447', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,478', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '37,488', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,500', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,504', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,536', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '37,545', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,564', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,567', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,598', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '37,608', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,621', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,625', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,656', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '37,664', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,677', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,681', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,717', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '37,726', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,738', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,741', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,778', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '37,788', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,802', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,806', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,841', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '37,851', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,863', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,866', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,903', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '37,913', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,926', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,930', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,967', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '37,969', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '37,984', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '37,996', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '37,996', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '37,997', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '38,113', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '38,113', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '38,114', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.3, max_depth=70,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.2,']\n", - "['n_estimators=10, n_jobs=-1, num_leaves=10, objective=None,']\n", - "['random_state=123, reg_alpha=0.4, reg_lambda=0.1, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '38,114', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '38,121', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '38,132', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.3, max_depth=70,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.2,']\n", - "['n_estimators=10, n_jobs=-1, num_leaves=10, objective=None,']\n", - "['random_state=123, reg_alpha=0.4, reg_lambda=0.1, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '38,132', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '38,132', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '38,394', 'INFO', 'create_model_container', '12']\n", - "['2020-07-31 08', '45', '38,394', 'INFO', 'master_model_container', '12']\n", - "['2020-07-31 08', '45', '38,395', 'INFO', 'display_container', '13']\n", - "['2020-07-31 08', '45', '38,395', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.3, max_depth=70,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.2,']\n", - "['n_estimators=10, n_jobs=-1, num_leaves=10, objective=None,']\n", - "['random_state=123, reg_alpha=0.4, reg_lambda=0.1, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '38,395', 'INFO', 'tune_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '38,408', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '38,409', 'INFO', 'create_model(estimator=dt, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '38,409', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '38,409', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '38,409', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '38,428', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '38,428', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '38,429', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '38,430', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '38,435', 'INFO', 'Decision Tree Regressor Imported succesfully']\n", - "['2020-07-31 08', '45', '38,437', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '38,440', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '38,446', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,451', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,453', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,453', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,467', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '38,472', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,478', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,479', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,479', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,493', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '38,500', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,505', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,507', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,507', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,521', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '38,527', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,532', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,534', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,534', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,549', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '38,555', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,560', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,562', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,562', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,577', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '38,583', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,588', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,590', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,590', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,606', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '38,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,617', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,619', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,619', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,635', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '38,640', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,647', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,648', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,648', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,664', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '38,671', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,675', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,677', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,677', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,693', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '38,698', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,704', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,705', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,705', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,722', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '38,723', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '38,731', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '38,739', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '38,888', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '38,888', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '38,889', 'INFO', \"save_model(model=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '45', '38,889', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '38,895', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '38,900', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), None]\"]\n", - "['2020-07-31 08', '45', '38,900', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '38,901', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '38,918', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '38,918', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '38,949', 'INFO', 'create_model_container', '13']\n", - "['2020-07-31 08', '45', '38,949', 'INFO', 'master_model_container', '13']\n", - "['2020-07-31 08', '45', '38,949', 'INFO', 'display_container', '14']\n", - "['2020-07-31 08', '45', '38,950', 'INFO', \"DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')\"]\n", - "['2020-07-31 08', '45', '38,950', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '38,955', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 08', '45', '38,955', 'INFO', \"ensemble_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Bagging, fold=10, n_estimators=50, round=4, choose_better=False, optimize=R2, verbose=True)\"]\n", - "['2020-07-31 08', '45', '38,955', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '38,955', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '38,955', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '38,978', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '38,978', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '38,980', 'INFO', 'Checking base model']\n", - "['2020-07-31 08', '45', '38,981', 'INFO', 'Base model', 'Decision Tree']\n", - "['2020-07-31 08', '45', '38,985', 'INFO', 'BaggingRegressor() succesfully imported']\n", - "['2020-07-31 08', '45', '38,990', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '38,991', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '38,996', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,156', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,178', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '39,183', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,330', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,335', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,350', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '39,355', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,486', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '39,486', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,515', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '39,521', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,651', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,666', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,684', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '39,689', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,816', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,816', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,844', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '39,849', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,986', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,986', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,007', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '40,012', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '40,154', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '40,154', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,178', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '40,183', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '40,327', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '40,332', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,348', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '40,353', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '40,503', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '40,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,528', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '40,533', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '40,698', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '40,704', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,721', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '40,722', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '40,730', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '40,882', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '40,882', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '40,883', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '40,950', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '40,951', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '40,952', 'INFO', 'save_model(model=BaggingRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=50, n_jobs=None, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '40,952', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '40,976', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '40,981', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), BaggingRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=50, n_jobs=None, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '45', '40,981', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '40,981', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'create_model_container', '14']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'master_model_container', '14']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'display_container', '15']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'BaggingRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=50, n_jobs=None, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '41,133', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 08', '45', '41,134', 'INFO', \"ensemble_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Boosting, fold=10, n_estimators=10, round=4, choose_better=False, optimize=R2, verbose=True)\"]\n", - "['2020-07-31 08', '45', '41,134', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '41,134', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '41,134', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '41,157', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '41,157', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '41,159', 'INFO', 'Checking base model']\n", - "['2020-07-31 08', '45', '41,160', 'INFO', 'Base model', 'Decision Tree']\n", - "['2020-07-31 08', '45', '41,166', 'INFO', 'AdaBoostRegressor() succesfully imported']\n", - "['2020-07-31 08', '45', '41,172', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '41,172', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '41,179', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,212', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,214', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,228', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '41,233', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,265', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,268', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,283', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '41,288', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,322', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,325', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,339', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '41,345', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,378', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,380', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,395', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '41,399', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,443', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,445', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,460', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '41,465', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,496', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,499', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,516', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '41,521', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,555', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,557', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,573', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '41,578', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,616', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,619', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,638', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '41,644', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,686', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,690', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,707', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '41,713', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,749', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,751', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,768', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '41,768', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '41,776', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '41,814', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '41,814', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '41,814', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '41,869', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '41,869', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '41,870', 'INFO', 'save_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '41,871', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '41,878', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '41,883', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), None]']\n", - "['2020-07-31 08', '45', '41,883', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '41,883', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '42,011', 'INFO', 'create_model_container', '15']\n", - "['2020-07-31 08', '45', '42,011', 'INFO', 'master_model_container', '15']\n", - "['2020-07-31 08', '45', '42,011', 'INFO', 'display_container', '16']\n", - "['2020-07-31 08', '45', '42,012', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '45', '42,012', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'Initializing blend_models()']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'blend_models(estimator_list=All, fold=10, round=4, choose_better=False, optimize=R2, turbo=True, verbose=True)']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '42,034', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '42,034', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '42,036', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '42,036', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '42,041', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 08', '45', '42,041', 'INFO', 'Import successful']\n", - "['2020-07-31 08', '45', '42,042', 'INFO', 'Defining model names in estimator_list']\n", - "['2020-07-31 08', '45', '45,250', 'INFO', 'n_jobs multiple passed']\n", - "['2020-07-31 08', '45', '45,265', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '45,280', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '48,335', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '48,715', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '48,739', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '48,753', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '51,531', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '51,907', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '51,935', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '51,944', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '54,960', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '55,340', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '55,370', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '55,380', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '58,319', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '58,719', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '58,743', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '58,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '01,634', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '02,022', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '02,053', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '02,064', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '04,996', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '05,375', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '05,404', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '05,415', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '08,454', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '08,850', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '08,884', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '08,894', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '11,712', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '12,102', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '12,118', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '12,134', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '14,865', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '15,254', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '15,270', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '15,286', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '18,564', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '18,970', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '19,005', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '19,007', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '19,022', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '22,593', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '22,593', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '22,594', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '22,641', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '22,642', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '22,679', 'INFO', \"save_model(model=VotingRegressor(estimators=[('Linear Regression_0',\"]\n", - "['LinearRegression(copy_X=True, fit_intercept=True,']\n", - "['n_jobs=-1, normalize=False)),']\n", - "[\"('Lasso_1',\"]\n", - "['Lasso(alpha=1.0, copy_X=True, fit_intercept=True,']\n", - "['max_iter=1000, normalize=False,']\n", - "['positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic',\"]\n", - "['tol=0.0001, warm_start=False)),']\n", - "[\"('Ridge_2',\"]\n", - "['Ridge(alpha=1.0, copy_X=True...']\n", - "['min_child_samples=20,']\n", - "['min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100,']\n", - "['n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123,']\n", - "['reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0,']\n", - "['subsample_for_bin=200000,']\n", - "['subsample_freq=0)),']\n", - "[\"('CatBoost Regressor_21',\"]\n", - "[')],']\n", - "['n_jobs=-1, verbose=False, weights=None), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '22,679', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '22,831', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '22,915', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), VotingRegressor(estimators=[('Linear Regression_0',\"]\n", - "['LinearRegression(copy_X=True, fit_intercept=True,']\n", - "['n_jobs=-1, normalize=False)),']\n", - "[\"('Lasso_1',\"]\n", - "['Lasso(alpha=1.0, copy_X=True, fit_intercept=True,']\n", - "['max_iter=1000, normalize=False,']\n", - "['positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic',\"]\n", - "['tol=0.0001, warm_start=False)),']\n", - "[\"('Ridge_2',\"]\n", - "['Ridge(alpha=1.0, copy_X=True...']\n", - "['min_child_samples=20,']\n", - "['min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100,']\n", - "['n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123,']\n", - "['reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0,']\n", - "['subsample_for_bin=200000,']\n", - "['subsample_freq=0)),']\n", - "[\"('CatBoost Regressor_21',\"]\n", - "[')],']\n", - "['n_jobs=-1, verbose=False, weights=None), None]']\n", - "['2020-07-31 08', '46', '22,915', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '22,915', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '23,715', 'INFO', 'create_model_container', '16']\n", - "['2020-07-31 08', '46', '23,715', 'INFO', 'master_model_container', '16']\n", - "['2020-07-31 08', '46', '23,715', 'INFO', 'display_container', '17']\n", - "['2020-07-31 08', '46', '23,735', 'INFO', \"VotingRegressor(estimators=[('Linear Regression_0',\"]\n", - "['LinearRegression(copy_X=True, fit_intercept=True,']\n", - "['n_jobs=-1, normalize=False)),']\n", - "[\"('Lasso_1',\"]\n", - "['Lasso(alpha=1.0, copy_X=True, fit_intercept=True,']\n", - "['max_iter=1000, normalize=False,']\n", - "['positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic',\"]\n", - "['tol=0.0001, warm_start=False)),']\n", - "[\"('Ridge_2',\"]\n", - "['Ridge(alpha=1.0, copy_X=True...']\n", - "['min_child_samples=20,']\n", - "['min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100,']\n", - "['n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123,']\n", - "['reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0,']\n", - "['subsample_for_bin=200000,']\n", - "['subsample_freq=0)),']\n", - "[\"('CatBoost Regressor_21',\"]\n", - "[')],']\n", - "['n_jobs=-1, verbose=False, weights=None)']\n", - "['2020-07-31 08', '46', '23,735', 'INFO', 'blend_models() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '23,746', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 08', '46', '23,746', 'INFO', \"compare_models(blacklist=None, whitelist=['rf', 'et', 'ada', 'gbr', 'xgboost', 'lightgbm', 'catboost'], fold=5, round=4, sort=R2, n_select=5, turbo=True, verbose=True)\"]\n", - "['2020-07-31 08', '46', '23,746', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '23,746', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '23,746', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '23,764', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '23,765', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '23,770', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 08', '46', '23,771', 'INFO', 'Import successful']\n", - "['2020-07-31 08', '46', '23,777', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '23,777', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '23,777', 'INFO', 'Initializing Random Forest']\n", - "['2020-07-31 08', '46', '23,782', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '23,789', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '24,034', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '24,142', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '24,143', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '24,164', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '24,176', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '24,434', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '24,549', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '24,549', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '24,561', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '24,578', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '24,918', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '25,038', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '25,038', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '25,064', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '25,081', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '25,328', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '25,435', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '25,436', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '25,448', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '25,458', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '25,707', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '25,823', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '25,823', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '25,823', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '25,823', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '25,838', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '25,900', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '25,900', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '25,900', 'INFO', \"save_model(model=RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '25,900', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '25,932', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '25,932', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '46', '25,932', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '25,932', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '25,987', 'INFO', 'Initializing Extra Trees Regressor']\n", - "['2020-07-31 08', '46', '25,992', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '25,998', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '26,142', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '26,268', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '26,268', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '26,284', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '26,303', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '26,440', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '26,546', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '26,546', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '26,553', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '26,563', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '26,705', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '26,821', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '26,821', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '26,836', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '26,852', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,011', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,117', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,118', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,139', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '27,139', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,295', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,421', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,421', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,421', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '27,421', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '27,436', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '27,502', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '27,502', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '27,503', 'INFO', \"save_model(model=ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '27,503', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '27,523', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '27,539', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '46', '27,539', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '27,539', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '27,586', 'INFO', 'Initializing AdaBoost Regressor']\n", - "['2020-07-31 08', '46', '27,601', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '27,601', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,633', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,633', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,633', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,633', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '27,647', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,663', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,665', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,665', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,670', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '27,674', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,674', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,674', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,674', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,689', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '27,689', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,705', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,705', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,705', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,705', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '27,721', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '27,752', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '27,799', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '27,799', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '27,799', 'INFO', \"save_model(model=AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '27,799', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '27,814', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '27,814', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", - "['n_estimators=50, random_state=123), None]']\n", - "['2020-07-31 08', '46', '27,814', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '27,814', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '27,846', 'INFO', 'Initializing Gradient Boosting Regressor']\n", - "['2020-07-31 08', '46', '27,846', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '27,861', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,924', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,924', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,924', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,939', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '27,939', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,002', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,018', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,018', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,018', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '28,018', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,174', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,174', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,174', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,174', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '28,189', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,252', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,252', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,252', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,267', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '28,267', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '28,267', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '28,330', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '28,330', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '28,330', 'INFO', \"save_model(model=GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '28,330', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '28,346', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '28,346', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '46', '28,346', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '28,346', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '28,408', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 08', '46', '28,408', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '28,424', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,471', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,471', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,471', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,486', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '28,502', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,549', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,549', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,549', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,564', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '28,580', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,611', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,611', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,611', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,627', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '28,642', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,689', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,689', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,689', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,705', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '28,720', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,767', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,783', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,783', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,799', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '28,799', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '28,830', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '28,939', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '28,939', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '28,939', 'INFO', \"save_model(model=XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '28,939', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '28,955', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '28,955', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), None]']\n", - "['2020-07-31 08', '46', '28,955', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '28,955', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '29,017', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 08', '46', '29,017', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '29,033', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,127', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,127', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,127', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,142', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '29,158', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,252', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,267', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,267', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,283', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '29,283', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,392', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,392', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,392', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,423', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '29,423', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,533', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,533', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,533', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,548', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '29,564', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,658', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,673', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,673', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,689', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '29,689', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '29,720', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '29,830', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '29,830', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '29,830', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '29,830', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '29,861', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '29,876', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '46', '29,876', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '29,876', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '29,970', 'INFO', 'Initializing CatBoost Regressor']\n", - "['2020-07-31 08', '46', '29,970', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '29,986', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '31,376', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '31,392', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '31,392', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '31,392', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '31,407', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '32,847', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '32,863', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '32,863', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '32,863', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '32,878', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '34,175', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '34,175', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '34,175', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '34,190', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '34,190', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '35,582', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '35,582', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '35,582', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '35,582', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '35,598', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,028', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,028', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '37,028', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,043', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '37,043', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '37,059', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '37,121', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '37,121', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '37,121', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '37,121', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '37,137', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '37,137', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), , None]']\n", - "['2020-07-31 08', '46', '37,137', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '37,137', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '37,184', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 08', '46', '37,184', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'create_model(estimator=xgboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Extreme Gradient Boosting Regressor Imported succesfully']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,246', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,246', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,246', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,262', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '37,262', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,309', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,309', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,309', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,325', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '37,325', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,371', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,371', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,371', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,387', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '37,387', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,434', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,434', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,434', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,449', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '37,449', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,496', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,496', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,496', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,512', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '37,512', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,559', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,559', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,559', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,574', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '37,590', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,621', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,637', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,637', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,653', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '37,653', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,699', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,699', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,699', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,715', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '37,715', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,762', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,762', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,762', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,778', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '37,778', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,840', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,840', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,856', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '37,856', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '37,871', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'create_model_container', '17']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'master_model_container', '17']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'display_container', '18']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', \"XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'create_model(estimator=gbr, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Gradient Boosting Regressor Imported succesfully']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,324', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,324', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,324', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,340', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '38,340', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,418', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,418', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,418', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,434', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '38,434', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,590', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,590', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,590', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,605', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '38,605', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '38,933', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'create_model_container', '18']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'master_model_container', '18']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'display_container', '19']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', \"GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False)']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'create_model(estimator=catboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'CatBoost Regressor Imported succesfully']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '41,620', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '41,620', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '41,620', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '41,636', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '41,636', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '42,979', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '42,995', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '42,995', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '42,995', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '42,995', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '45,653', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '45,653', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '45,653', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '45,669', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '45,669', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '47,181', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '47,181', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '47,181', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '47,197', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '47,197', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '48,509', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '48,509', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '48,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '48,524', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '48,524', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '49,928', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '49,939', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '49,940', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '49,953', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '49,955', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '51,527', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '51,530', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '51,530', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '51,540', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '51,542', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '53,254', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '53,260', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '53,260', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '53,270', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '53,272', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '53,276', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '54,768', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '54,768', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '54,768', 'INFO', 'create_model_container', '19']\n", - "['2020-07-31 08', '46', '54,769', 'INFO', 'master_model_container', '19']\n", - "['2020-07-31 08', '46', '54,769', 'INFO', 'display_container', '20']\n", - "['2020-07-31 08', '46', '54,769', 'INFO', '']\n", - "['2020-07-31 08', '46', '54,769', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'create_model(estimator=rf, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '54,786', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '54,787', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '54,787', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '54,788', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '54,788', 'INFO', 'Random Forest Regressor Imported succesfully']\n", - "['2020-07-31 08', '46', '54,789', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '54,790', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '54,792', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '55,056', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '55,173', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '55,173', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '55,183', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '55,185', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '55,444', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '55,568', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '55,568', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '55,568', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '55,568', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '55,811', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '55,932', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '55,932', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '55,932', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '55,932', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '56,191', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '56,303', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '56,303', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '56,310', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '56,311', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '56,564', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '56,678', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '56,678', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '56,684', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '56,685', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '56,948', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '57,053', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '57,055', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '57,066', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '57,066', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '57,232', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '57,338', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '57,338', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '57,348', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '57,349', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '57,609', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '57,724', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '57,724', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '57,726', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '57,740', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '57,980', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '58,097', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '58,097', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '58,097', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '58,097', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '58,350', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '58,456', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '58,456', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '58,464', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '58,465', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '58,469', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'create_model_container', '20']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'master_model_container', '20']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'display_container', '21']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', \"RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '58,766', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '58,767', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '58,768', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '58,768', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '58,768', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '46', '58,769', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '58,770', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '58,772', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '58,848', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '58,848', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '58,848', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '58,864', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '58,864', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '58,926', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '58,942', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '58,942', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '58,942', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '58,958', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,037', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,041', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,041', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,053', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '59,055', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,148', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,152', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,153', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,164', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '59,166', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,250', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,250', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,250', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,265', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '59,265', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,359', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,375', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,375', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,375', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '59,390', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,492', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,497', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,497', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,510', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '59,513', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,629', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,634', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,634', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,649', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '59,652', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,760', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,765', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,765', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,778', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '59,780', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,935', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,941', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,941', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,956', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '59,959', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '59,969', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '47', '00,131', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '47', '00,131', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '47', '00,131', 'INFO', 'create_model_container', '21']\n", - "['2020-07-31 08', '47', '00,132', 'INFO', 'master_model_container', '21']\n", - "['2020-07-31 08', '47', '00,132', 'INFO', 'display_container', '22']\n", - "['2020-07-31 08', '47', '00,133', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '47', '00,133', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '00,133', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 08', '47', '00,231', 'INFO', 'create_model_container', '21']\n", - "['2020-07-31 08', '47', '00,231', 'INFO', 'master_model_container', '21']\n", - "['2020-07-31 08', '47', '00,231', 'INFO', 'display_container', '23']\n", - "['2020-07-31 08', '47', '00,233', 'INFO', \"[XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)]']\n", - "['2020-07-31 08', '47', '00,233', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '00,241', 'INFO', 'Initializing stack_models()']\n", - "['2020-07-31 08', '47', '00,243', 'INFO', \"stack_models(estimator_list=[XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)], meta_model=None, fold=10, round=4, restack=True, plot=False, choose_better=False, optimize=R2, finalize=False, verbose=True)']\n", - "['2020-07-31 08', '47', '00,243', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '00,243', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '00,243', 'INFO', 'Copying estimator list']\n", - "['2020-07-31 08', '47', '00,296', 'INFO', 'Defining meta model']\n", - "['2020-07-31 08', '47', '00,299', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '00,346', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '00,348', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '47', '00,349', 'INFO', 'Getting model names']\n", - "['2020-07-31 08', '47', '00,356', 'INFO', 'Checking base model', 'XGBRegressor']\n", - "['2020-07-31 08', '47', '00,367', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '00,435', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '01,084', 'INFO', 'Checking base model', 'GradientBoostingRegressor']\n", - "['2020-07-31 08', '47', '01,096', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '01,257', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '02,082', 'INFO', 'Checking base model', 'CatBoostRegressor']\n", - "['2020-07-31 08', '47', '02,097', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '03,663', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '24,424', 'INFO', 'Checking base model', 'RandomForestRegressor']\n", - "['2020-07-31 08', '47', '24,430', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '24,814', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '28,106', 'INFO', 'Checking base model', 'LGBMRegressor']\n", - "['2020-07-31 08', '47', '28,120', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '28,227', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '29,899', 'INFO', 'Base layer complete']\n", - "['2020-07-31 08', '47', '29,916', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '47', '29,919', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '47', '29,935', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '29,942', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '29,948', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '29,990', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '47', '29,999', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,006', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,031', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '47', '30,044', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,052', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,057', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,089', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '47', '30,101', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,108', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,112', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,141', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '47', '30,153', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,158', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,163', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,190', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '47', '30,200', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,206', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,208', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,237', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '47', '30,247', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,253', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,255', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,280', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '47', '30,289', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,296', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,300', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,321', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '47', '30,330', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,335', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,338', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,369', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '47', '30,380', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,387', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,390', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,419', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '47', '30,420', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '47', '30,429', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '47', '30,430', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '47', '30,431', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '47', '30,542', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '30,542', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '30,547', 'INFO', \"save_model(model=[XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), True], model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '47', '30,547', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '30,631', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '30,651', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), [XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), True], None]']\n", - "['2020-07-31 08', '47', '30,652', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '30,652', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '31,205', 'INFO', 'create_model_container', '22']\n", - "['2020-07-31 08', '47', '31,205', 'INFO', 'master_model_container', '22']\n", - "['2020-07-31 08', '47', '31,205', 'INFO', 'display_container', '24']\n", - "['2020-07-31 08', '47', '31,209', 'INFO', \"[XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), True]']\n", - "['2020-07-31 08', '47', '31,209', 'INFO', 'stack_models() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '31,222', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '31,223', 'INFO', \"plot_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), plot=residuals, save=False, verbose=True, system=True)\"]\n", - "['2020-07-31 08', '47', '31,223', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '31,224', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '31,224', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '31,239', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '31,240', 'INFO', 'plot type', 'residuals']\n", - "['2020-07-31 08', '47', '31,385', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '31,427', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 08', '47', '32,278', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '32,279', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '32,288', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '32,289', 'INFO', \"plot_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), plot=error, save=False, verbose=True, system=True)\"]\n", - "['2020-07-31 08', '47', '32,289', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '32,289', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '32,290', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '32,300', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '32,301', 'INFO', 'plot type', 'error']\n", - "['2020-07-31 08', '47', '32,302', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '32,303', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 08', '47', '32,533', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '32,533', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '32,540', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '32,541', 'INFO', \"plot_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), plot=feature, save=False, verbose=True, system=True)\"]\n", - "['2020-07-31 08', '47', '32,541', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '32,541', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '32,541', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '32,551', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '32,552', 'INFO', 'plot type', 'feature']\n", - "['2020-07-31 08', '47', '32,696', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '32,697', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '32,721', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '32,722', 'INFO', \"plot_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), plot=parameter, save=False, verbose=True, system=True)\"]\n", - "['2020-07-31 08', '47', '32,722', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '32,722', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '32,722', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '32,731', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '32,732', 'INFO', 'plot type', 'parameter']\n", - "['2020-07-31 08', '47', '32,740', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '32,740', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '32,751', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 08', '47', '32,752', 'INFO', \"interpret_model(estimator=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), plot=summary, feature=None, observation=None)']\n", - "['2020-07-31 08', '47', '32,752', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '32,946', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '32,946', 'INFO', 'plot type', 'summary']\n", - "['2020-07-31 08', '47', '32,946', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 08', '47', '33,221', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 08', '47', '33,761', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '33,761', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '33,767', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 08', '47', '33,768', 'INFO', \"interpret_model(estimator=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), plot=correlation, feature=None, observation=None)']\n", - "['2020-07-31 08', '47', '33,768', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '33,769', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '33,769', 'INFO', 'plot type', 'correlation']\n", - "['2020-07-31 08', '47', '33,769', 'WARNING', 'No feature passed. Default value of feature used for correlation plot', 'age']\n", - "['2020-07-31 08', '47', '33,769', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 08', '47', '34,080', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 08', '47', '34,387', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '34,387', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '34,395', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 08', '47', '34,396', 'INFO', \"interpret_model(estimator=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), plot=reason, feature=None, observation=12)']\n", - "['2020-07-31 08', '47', '34,396', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '34,397', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '34,397', 'INFO', 'plot type', 'reason']\n", - "['2020-07-31 08', '47', '34,398', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 08', '47', '34,661', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 08', '47', '34,753', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '34,754', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '34,811', 'INFO', 'Initializing automl()']\n", - "['2020-07-31 08', '47', '34,812', 'INFO', 'automl(optimize=MAE, use_holdout=False)']\n", - "['2020-07-31 08', '47', '34,812', 'INFO', 'Model Selection Basis', 'CV Results on Training set']\n", - "['2020-07-31 08', '47', '34,820', 'INFO', 'SubProcess finalize_model() called ==================================']\n", - "['2020-07-31 08', '47', '34,821', 'INFO', 'Initializing finalize_model()']\n", - "['2020-07-31 08', '47', '34,822', 'INFO', 'finalize_model(estimator=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123))']\n", - "['2020-07-31 08', '47', '34,822', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '34,822', 'INFO', 'Getting model name']\n", - "['2020-07-31 08', '47', '34,823', 'INFO', 'Finalizing AdaBoost Regressor']\n", - "['2020-07-31 08', '47', '34,883', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '47', '34,935', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 08', '47', '34,936', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '47', '34,937', 'INFO', 'create_model(estimator=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '47', '34,937', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '34,937', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '34,937', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '34,953', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '47', '34,954', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '34,954', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '47', '34,954', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '47', '34,955', 'INFO', 'Declaring custom model']\n", - "['2020-07-31 08', '47', '34,956', 'INFO', 'AdaBoost Regressor Imported succesfully']\n", - "['2020-07-31 08', '47', '34,957', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '47', '34,958', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '47', '34,961', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,005', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,008', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,015', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '47', '35,016', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,074', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,078', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,079', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,088', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '47', '35,089', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,141', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,145', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,146', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,153', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '47', '35,154', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,201', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,204', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,204', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,211', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '47', '35,213', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,259', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,262', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,262', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,269', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '47', '35,270', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,312', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,316', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,316', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,322', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '47', '35,324', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,365', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,369', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,369', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,375', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '47', '35,376', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,417', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,420', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,420', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,426', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '47', '35,427', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,468', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,471', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,471', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,477', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '47', '35,478', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,518', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,521', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,521', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,527', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '47', '35,528', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '47', '35,532', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'create_model_container', '23']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'master_model_container', '23']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'display_container', '25']\n", - "['2020-07-31 08', '47', '35,576', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '47', '35,576', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '35,576', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 08', '47', '35,635', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '35,636', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '35,637', 'INFO', 'save_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '47', '35,637', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '35,647', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '35,653', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), None]']\n", - "['2020-07-31 08', '47', '35,653', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '35,653', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '35,712', 'INFO', 'create_model_container', '23']\n", - "['2020-07-31 08', '47', '35,712', 'INFO', 'master_model_container', '23']\n", - "['2020-07-31 08', '47', '35,712', 'INFO', 'display_container', '25']\n", - "['2020-07-31 08', '47', '35,713', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '47', '35,713', 'INFO', 'finalize_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '35,713', 'INFO', 'SubProcess finalize_model() end ==================================']\n", - "['2020-07-31 08', '47', '35,714', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '47', '35,715', 'INFO', 'automl() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '35,914', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '35,916', 'INFO', 'save_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), model_name=best-model, verbose=True)']\n", - "['2020-07-31 08', '47', '35,916', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '35,932', 'INFO', 'best-model.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '35,942', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), None]']\n", - "['2020-07-31 08', '47', '35,942', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '36,014', 'INFO', 'Initializing deploy_model()']\n", - "['2020-07-31 08', '47', '36,016', 'INFO', 'deploy_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "[\"random_state=123), model_name=best-aws, authentication={'bucket'\", \"'pycaret-test'}, platform=aws)\"]\n", - "['2020-07-31 08', '47', '36,019', 'INFO', 'Platform', 'AWS S3']\n", - "['2020-07-31 08', '47', '36,202', 'INFO', 'Saving model in active working directory']\n", - "['2020-07-31 08', '47', '36,202', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '36,203', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '36,204', 'INFO', 'save_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), model_name=best-aws, verbose=False)']\n", - "['2020-07-31 08', '47', '36,204', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '36,214', 'INFO', 'best-aws.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '36,220', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), None]']\n", - "['2020-07-31 08', '47', '36,220', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '36,220', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '36,220', 'INFO', 'Initializing S3 client']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'PyCaret Clustering Module']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'version 2.0']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'Initializing setup()']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'USI', '872d']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'setup(data=(224, 21), categorical_features=None, categorical_imputation=constant, ordinal_features=None, high_cardinality_features=None,']\n", - "[\"numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=['Country Name'], normalize=False,\"]\n", - "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", - "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None,']\n", - "['remove_multicollinearity=False, multicollinearity_threshold=0.9, group_features=None,']\n", - "['group_names=None, supervised=False, supervised_target=None, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", - "['experiment_name=health1, log_plots=True, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'Checking environment']\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'python_version', '3.7.4']\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'python_build', \"('default', 'Aug 9 2019 18\", '34', \"13')\"]\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'machine', 'AMD64']\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'Memory', 'svmem(total=17032478720, available=10622828544, percent=37.6, used=6409650176, free=10622828544)']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'Physical Core', '4']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'Logical Core', '8']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'Checking libraries']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'pd==1.0.5']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'numpy==1.18.5']\n", - "['2020-07-31 08', '47', '37,218', 'INFO', 'sklearn==0.23.1']\n", - "['2020-07-31 08', '47', '37,223', 'INFO', 'kmodes==0.10.1']\n", - "['2020-07-31 08', '47', '37,758', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '47', '37,758', 'INFO', 'deploy_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '37,765', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '47', '37,765', 'INFO', 'get_config(variable=X_train)']\n", - "['2020-07-31 08', '47', '37,765', 'INFO', 'Global variable', 'X_train returned']\n", - "['2020-07-31 08', '47', '37,765', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '37,788', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '47', '37,788', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 08', '47', '37,788', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 08', '47', '37,788', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '37,795', 'INFO', 'Initializing set_config()']\n", - "['2020-07-31 08', '47', '37,795', 'INFO', 'set_config(variable=seed, value=999)']\n", - "['2020-07-31 08', '47', '37,795', 'INFO', 'Global variable', 'seed updated']\n", - "['2020-07-31 08', '47', '37,796', 'INFO', 'set_config() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '37,801', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '47', '37,801', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 08', '47', '37,801', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 08', '47', '37,801', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '38,740', 'INFO', 'mlflow==1.8.0']\n", - "['2020-07-31 08', '47', '38,741', 'INFO', 'Checking Exceptions']\n", - "['2020-07-31 08', '47', '38,741', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '38,741', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '38,760', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '38,761', 'INFO', 'Declaring global variables']\n", - "['2020-07-31 08', '47', '38,761', 'INFO', 'Copying data for preprocessing']\n", - "['2020-07-31 08', '47', '38,767', 'INFO', 'Declaring preprocessing parameters']\n", - "['2020-07-31 08', '47', '38,767', 'INFO', 'Importing preprocessing module']\n", - "['2020-07-31 08', '47', '40,016', 'INFO', 'Creating preprocessing pipeline']\n", - "['2020-07-31 08', '47', '40,955', 'INFO', 'Preprocessing pipeline created successfully']\n", - "['2020-07-31 08', '47', '40,955', 'INFO', 'Creating grid variables']\n", - "['2020-07-31 08', '47', '40,957', 'INFO', 'Creating global containers']\n", - "['2020-07-31 08', '47', '41,398', 'INFO', 'Logging experiment in MLFlow']\n", - "['2020-07-31 08', '47', '41,542', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '41,543', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '41,555', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", - "['2020-07-31 08', '47', '41,555', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '41,565', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '41,580', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "['verbose=False), Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "['verbose=False)]']\n", - "['2020-07-31 08', '47', '41,580', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '41,580', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '41,699', 'INFO', 'Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "['verbose=False)']\n", - "['2020-07-31 08', '47', '41,699', 'INFO', 'setup() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '41,768', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '47', '41,768', 'INFO', 'create_model(model=kmeans, num_clusters=4, ground_truth=None, verbose=True, system=True)']\n", - "['2020-07-31 08', '47', '41,769', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '41,769', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '41,769', 'INFO', 'Setting num_cluster param']\n", - "['2020-07-31 08', '47', '41,769', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '41,790', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 08', '47', '41,790', 'INFO', 'K-Means Clustering Imported succesfully']\n", - "['2020-07-31 08', '47', '41,796', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '41,892', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '41,915', 'INFO', 'Creating Metrics dataframe']\n", - "['2020-07-31 08', '47', '41,917', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '47', '42,047', 'INFO', 'SubProcess plot_model() called ==================================']\n", - "['2020-07-31 08', '47', '42,047', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '42,048', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=cluster, feature=None, label=False, save=True, system=False)']\n", - "['2020-07-31 08', '47', '42,048', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '42,048', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '43,583', 'INFO', 'plot type', 'cluster']\n", - "['2020-07-31 08', '47', '43,583', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '47', '43,584', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '47', '43,584', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", - "['2020-07-31 08', '47', '43,585', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '43,585', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '43,585', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '47', '43,585', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", - "['2020-07-31 08', '47', '43,585', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '43,602', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '47', '43,603', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '47', '43,603', 'INFO', '(224, 21)']\n", - "['2020-07-31 08', '47', '43,603', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '43,603', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '47', '43,612', 'INFO', 'Fitting PCA()']\n", - "['2020-07-31 08', '47', '43,620', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '47', '43,623', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '47', '47,566', 'INFO', \"Saving 'Cluster.html' in current active directory\"]\n", - "['2020-07-31 08', '47', '47,566', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '47,566', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '47,921', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '47,921', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=distribution, feature=None, label=False, save=True, system=False)']\n", - "['2020-07-31 08', '47', '47,921', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '47,921', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '47,932', 'INFO', 'plot type', 'distribution']\n", - "['2020-07-31 08', '47', '47,932', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '47', '47,932', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '47', '47,933', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=False, verbose=False)']\n", - "['2020-07-31 08', '47', '47,933', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '47,933', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '47,933', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '47', '47,933', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '47,946', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '47', '47,946', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '47', '47,946', 'INFO', '(224, 22)']\n", - "['2020-07-31 08', '47', '47,947', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '47,947', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '47', '47,947', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '47', '47,953', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '47', '48,750', 'INFO', \"Saving 'Distribution.html' in current active directory\"]\n", - "['2020-07-31 08', '47', '48,750', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '48,750', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '49,086', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '49,087', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=elbow, feature=None, label=False, save=True, system=False)']\n", - "['2020-07-31 08', '47', '49,087', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '49,087', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '49,099', 'INFO', 'plot type', 'elbow']\n", - "['2020-07-31 08', '47', '49,361', 'INFO', 'Fitting KElbowVisualizer()']\n", - "['2020-07-31 08', '47', '49,949', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '47', '50,717', 'INFO', \"Saving 'Elbow.png' in current active directory\"]\n", - "['2020-07-31 08', '47', '50,717', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '50,717', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '50,729', 'INFO', 'SubProcess plot_model() end ==================================']\n", - "['2020-07-31 08', '47', '50,730', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '50,730', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '50,731', 'INFO', \"save_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '47', '50,731', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '50,737', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '50,744', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "[\"verbose=False), KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0)]']\n", - "['2020-07-31 08', '47', '50,744', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '50,744', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '50,783', 'INFO', \"KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0)']\n", - "['2020-07-31 08', '47', '50,784', 'INFO', 'create_models() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '50,796', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '47', '50,796', 'INFO', 'create_model(model=kmodes, num_clusters=4, ground_truth=None, verbose=True, system=True)']\n", - "['2020-07-31 08', '47', '50,796', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '50,797', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '50,797', 'INFO', 'Setting num_cluster param']\n", - "['2020-07-31 08', '47', '50,797', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '50,827', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 08', '47', '50,834', 'INFO', 'K-Modes Clustering Imported succesfully']\n", - "['2020-07-31 08', '47', '50,842', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '52,734', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '52,751', 'INFO', 'Creating Metrics dataframe']\n", - "['2020-07-31 08', '47', '52,753', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '47', '52,890', 'INFO', 'SubProcess plot_model() called ==================================']\n", - "['2020-07-31 08', '47', '52,891', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '52,891', 'INFO', \"plot_model(model=KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0), plot=cluster, feature=None, label=False, save=True, system=False)']\n", - "['2020-07-31 08', '47', '52,892', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '52,892', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '52,905', 'INFO', 'plot type', 'cluster']\n", - "['2020-07-31 08', '47', '52,905', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '47', '52,906', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '47', '52,907', 'INFO', \"assign_model(model=KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0), transformation=True, verbose=False)']\n", - "['2020-07-31 08', '47', '52,907', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '52,907', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '52,907', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '47', '52,908', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", - "['2020-07-31 08', '47', '52,908', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '52,926', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '47', '52,927', 'INFO', 'Trained Model', 'K-Modes Clustering']\n", - "['2020-07-31 08', '47', '52,927', 'INFO', '(224, 21)']\n", - "['2020-07-31 08', '47', '52,927', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '52,928', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '47', '52,935', 'INFO', 'Fitting PCA()']\n", - "['2020-07-31 08', '47', '52,945', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '47', '52,949', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '47', '53,559', 'INFO', \"Saving 'Cluster.html' in current active directory\"]\n", - "['2020-07-31 08', '47', '53,559', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '53,559', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '53,925', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '53,926', 'INFO', \"plot_model(model=KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0), plot=distribution, feature=None, label=False, save=True, system=False)']\n", - "['2020-07-31 08', '47', '53,926', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '53,926', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '53,939', 'INFO', 'plot type', 'distribution']\n", - "['2020-07-31 08', '47', '53,939', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '47', '53,939', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '47', '53,940', 'INFO', \"assign_model(model=KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0), transformation=False, verbose=False)']\n", - "['2020-07-31 08', '47', '53,940', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '53,940', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '53,940', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '47', '53,940', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '53,958', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '47', '53,959', 'INFO', 'Trained Model', 'K-Modes Clustering']\n", - "['2020-07-31 08', '47', '53,959', 'INFO', '(224, 22)']\n", - "['2020-07-31 08', '47', '53,959', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '53,959', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '47', '53,960', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '47', '53,967', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '47', '54,761', 'INFO', \"Saving 'Distribution.html' in current active directory\"]\n", - "['2020-07-31 08', '47', '54,761', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '54,761', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '55,112', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '55,113', 'INFO', \"plot_model(model=KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0), plot=elbow, feature=None, label=False, save=True, system=False)']\n", - "['2020-07-31 08', '47', '55,113', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '55,113', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '55,125', 'INFO', 'plot type', 'elbow']\n", - "['2020-07-31 08', '47', '55,145', 'INFO', 'Fitting KElbowVisualizer()']\n", - "['2020-07-31 08', '48', '00,303', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '00,447', 'INFO', \"Saving 'Elbow.png' in current active directory\"]\n", - "['2020-07-31 08', '48', '00,447', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '00,447', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '00,458', 'INFO', 'SubProcess plot_model() end ==================================']\n", - "['2020-07-31 08', '48', '00,458', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '48', '00,459', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '48', '00,459', 'INFO', \"save_model(model=KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '48', '00,459', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '48', '00,581', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '48', '00,586', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "[\"verbose=False), KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0)]']\n", - "['2020-07-31 08', '48', '00,587', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '00,587', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '48', '00,619', 'INFO', \"KModes(cat_dissim=, init='Cao',\"]\n", - "['max_iter=100, n_clusters=4, n_init=1, n_jobs=-1, random_state=123,']\n", - "['verbose=0)']\n", - "['2020-07-31 08', '48', '00,619', 'INFO', 'create_models() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '03,231', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '48', '03,231', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=False, verbose=True)']\n", - "['2020-07-31 08', '48', '03,232', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '03,232', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '48', '03,232', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '48', '03,232', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '48', '03,262', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '48', '03,262', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '48', '03,263', 'INFO', '(224, 22)']\n", - "['2020-07-31 08', '48', '03,264', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '04,898', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '04,898', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=cluster, feature=None, label=False, save=False, system=True)']\n", - "['2020-07-31 08', '48', '04,899', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '04,899', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '04,909', 'INFO', 'plot type', 'cluster']\n", - "['2020-07-31 08', '48', '04,909', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '48', '04,909', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '48', '04,910', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", - "['2020-07-31 08', '48', '04,910', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '04,910', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '48', '04,910', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '48', '04,911', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", - "['2020-07-31 08', '48', '04,911', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '48', '04,927', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '48', '04,927', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '48', '04,927', 'INFO', '(224, 21)']\n", - "['2020-07-31 08', '48', '04,927', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '04,928', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '48', '04,931', 'INFO', 'Fitting PCA()']\n", - "['2020-07-31 08', '48', '04,936', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '48', '04,938', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '05,369', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '05,369', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '07,179', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '07,180', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=cluster, feature=Country Name, label=True, save=False, system=True)']\n", - "['2020-07-31 08', '48', '07,180', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '07,180', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '07,187', 'INFO', 'plot type', 'cluster']\n", - "['2020-07-31 08', '48', '07,187', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '48', '07,188', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '48', '07,188', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", - "['2020-07-31 08', '48', '07,188', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '07,189', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '48', '07,189', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '48', '07,189', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", - "['2020-07-31 08', '48', '07,189', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '48', '07,199', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '48', '07,200', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '48', '07,200', 'INFO', '(224, 21)']\n", - "['2020-07-31 08', '48', '07,200', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '07,200', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '48', '07,204', 'INFO', 'Fitting PCA()']\n", - "['2020-07-31 08', '48', '07,207', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '48', '07,209', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '07,466', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '07,466', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '08,323', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '08,324', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=tsne, feature=None, label=False, save=False, system=True)']\n", - "['2020-07-31 08', '48', '08,324', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '08,324', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '08,334', 'INFO', 'plot type', 'tsne']\n", - "['2020-07-31 08', '48', '08,334', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '48', '08,334', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '48', '08,335', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=True, verbose=False)']\n", - "['2020-07-31 08', '48', '08,335', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '08,335', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '48', '08,335', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '48', '08,335', 'INFO', 'Transformation param set to True. Assigned clusters are attached on transformed dataset.']\n", - "['2020-07-31 08', '48', '08,335', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '48', '08,343', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '48', '08,344', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '48', '08,344', 'INFO', '(224, 21)']\n", - "['2020-07-31 08', '48', '08,344', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '08,344', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '48', '08,345', 'INFO', 'Fitting TSNE()']\n", - "['2020-07-31 08', '48', '10,591', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '48', '10,600', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '11,151', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '11,151', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '11,158', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '11,159', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=elbow, feature=None, label=False, save=False, system=True)']\n", - "['2020-07-31 08', '48', '11,159', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '11,159', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '11,168', 'INFO', 'plot type', 'elbow']\n", - "['2020-07-31 08', '48', '11,169', 'INFO', 'Fitting KElbowVisualizer()']\n", - "['2020-07-31 08', '48', '11,704', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '11,875', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '11,875', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '11,882', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '11,883', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=silhouette, feature=None, label=False, save=False, system=True)']\n", - "['2020-07-31 08', '48', '11,883', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '11,883', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '11,893', 'INFO', 'plot type', 'silhouette']\n", - "['2020-07-31 08', '48', '11,893', 'INFO', 'Fitting SilhouetteVisualizer()']\n", - "['2020-07-31 08', '48', '11,976', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '12,124', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '12,124', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '12,130', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '12,131', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=distance, feature=None, label=False, save=False, system=True)']\n", - "['2020-07-31 08', '48', '12,131', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '12,132', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '12,142', 'INFO', 'plot type', 'distance']\n", - "['2020-07-31 08', '48', '12,163', 'INFO', 'Fitting InterclusterDistance()']\n", - "['2020-07-31 08', '48', '12,187', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '12,317', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '12,317', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '12,325', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '48', '12,325', 'INFO', \"plot_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), plot=distribution, feature=None, label=False, save=False, system=True)']\n", - "['2020-07-31 08', '48', '12,325', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '12,325', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '48', '12,334', 'INFO', 'plot type', 'distribution']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '48', '12,335', 'INFO', 'SubProcess assign_model() called ==================================']\n", - "['2020-07-31 08', '48', '12,335', 'INFO', 'Initializing assign_model()']\n", - "['2020-07-31 08', '48', '12,336', 'INFO', \"assign_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), transformation=False, verbose=False)']\n", - "['2020-07-31 08', '48', '12,336', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '48', '12,336', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '48', '12,336', 'INFO', 'Copying data']\n", - "['2020-07-31 08', '48', '12,336', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '48', '12,347', 'INFO', 'Determining Trained Model']\n", - "['2020-07-31 08', '48', '12,347', 'INFO', 'Trained Model', 'K-Means Clustering']\n", - "['2020-07-31 08', '48', '12,347', 'INFO', '(224, 22)']\n", - "['2020-07-31 08', '48', '12,347', 'INFO', 'assign_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '12,347', 'INFO', 'SubProcess assign_model() end ==================================']\n", - "['2020-07-31 08', '48', '12,347', 'INFO', 'Sorting dataframe']\n", - "['2020-07-31 08', '48', '12,351', 'INFO', 'Rendering Visual']\n", - "['2020-07-31 08', '48', '12,781', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '48', '12,781', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '16,227', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '48', '16,228', 'INFO', \"save_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), model_name=kmeans, verbose=True)']\n", - "['2020-07-31 08', '48', '16,228', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '48', '16,239', 'INFO', 'kmeans.pkl saved in current working directory']\n", - "['2020-07-31 08', '48', '16,246', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "[\"verbose=False), KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0)]']\n", - "['2020-07-31 08', '48', '16,246', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '19,081', 'INFO', 'Initializing deploy_model()']\n", - "['2020-07-31 08', '48', '19,081', 'INFO', \"deploy_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "[\"random_state=123, tol=0.0001, verbose=0), model_name=kmeans-aws, authentication={'bucket'\", \"'pycaret-test'}, platform=aws)\"]\n", - "['2020-07-31 08', '48', '19,081', 'INFO', 'Platform', 'AWS S3']\n", - "['2020-07-31 08', '48', '19,264', 'INFO', 'Saving model in current working directory']\n", - "['2020-07-31 08', '48', '19,265', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '48', '19,265', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '48', '19,265', 'INFO', \"save_model(model=KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0), model_name=kmeans-aws, verbose=False)']\n", - "['2020-07-31 08', '48', '19,265', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '48', '19,269', 'INFO', 'kmeans-aws.pkl saved in current working directory']\n", - "['2020-07-31 08', '48', '19,273', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True,']\n", - "[\"features_todrop=['Country Name'],\"]\n", - "[\"ml_usecase='regression',\"]\n", - "['numerical_features=[],']\n", - "[\"target='dummy_target',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_...']\n", - "[\"target='dummy_target')),\"]\n", - "[\"('feature_time',\"]\n", - "['Make_Time_Features(list_of_features=None, time_feature=[])),']\n", - "[\"('group', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('binn', Empty()),\"]\n", - "[\"('fix_perfect', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('dummy', Dummify(target='dummy_target')),\"]\n", - "[\"('clean_names', Clean_Colum_Names()), ('fix_multi', Empty()),\"]\n", - "[\"('pca', Empty())],\"]\n", - "[\"verbose=False), KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0)]']\n", - "['2020-07-31 08', '48', '19,273', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '19,273', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '48', '19,273', 'INFO', 'Initializing S3 client']\n", - "['2020-07-31 08', '48', '20,241', 'INFO', \"KMeans(algorithm='auto', copy_x=True, init='k-means++', max_iter=300,\"]\n", - "[\"n_clusters=4, n_init=10, n_jobs=-1, precompute_distances='deprecated',\"]\n", - "['random_state=123, tol=0.0001, verbose=0)']\n", - "['2020-07-31 08', '48', '20,242', 'INFO', 'deploy_model() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '20,588', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '48', '20,588', 'INFO', 'get_config(variable=X)']\n", - "['2020-07-31 08', '48', '20,589', 'INFO', 'Global variable', 'X returned']\n", - "['2020-07-31 08', '48', '20,589', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '21,288', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '48', '21,288', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 08', '48', '21,288', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 08', '48', '21,289', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '21,687', 'INFO', 'Initializing set_config()']\n", - "['2020-07-31 08', '48', '21,687', 'INFO', 'set_config(variable=seed, value=999)']\n", - "['2020-07-31 08', '48', '21,687', 'INFO', 'Global variable', 'seed updated']\n", - "['2020-07-31 08', '48', '21,687', 'INFO', 'set_config() succesfully completed......................................']\n", - "['2020-07-31 08', '48', '22,013', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '48', '22,013', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 08', '48', '22,013', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 08', '48', '22,013', 'INFO', 'get_config() succesfully completed......................................']\n" - ] - } - ], - "source": [ - "get_system_logs()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# 11. MLFlow UI" + "# 10. MLFlow UI" ] }, { diff --git a/examples/PyCaret 2 Regression.ipynb b/examples/PyCaret 2 Regression.ipynb index 7ff5fd8f8097a8a4fad8d1282ce3c06f1ae2de56..c613a52a7ee3440e81ed1d119b7c3c5c77e08e26 100644 --- a/examples/PyCaret 2 Regression.ipynb +++ b/examples/PyCaret 2 Regression.ipynb @@ -3456,9103 +3456,7 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "# 16. Get System Logs" - ] - }, - { - "cell_type": "code", - "execution_count": 35, - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '40', '51,509', 'INFO', 'PyCaret Classification Module']\n", - "['2020-07-31 01', '40', '51,509', 'INFO', 'version 2.0']\n", - "['2020-07-31 01', '40', '51,509', 'INFO', 'Initializing setup()']\n", - "['2020-07-31 01', '40', '51,509', 'INFO', 'USI', '1cda']\n", - "['2020-07-31 01', '40', '51,510', 'INFO', 'setup(data=(1070, 19), target=Purchase, train_size=0.7, sampling=True, sample_estimator=None, categorical_features=None, categorical_imputation=constant, ordinal_features=None,']\n", - "['high_cardinality_features=None, high_cardinality_method=frequency, numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=None, normalize=False,']\n", - "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", - "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None, remove_outliers=False, outliers_threshold=0.05,']\n", - "['remove_multicollinearity=False, multicollinearity_threshold=0.9, remove_perfect_collinearity=False, create_clusters=False, cluster_iter=20,']\n", - "['polynomial_features=False, polynomial_degree=2, trigonometry_features=False, polynomial_threshold=0.1, group_features=None,']\n", - "['group_names=None, feature_selection=False, feature_selection_threshold=0.8, feature_interaction=False, feature_ratio=False, interaction_threshold=0.01,']\n", - "['fix_imbalance=False, fix_imbalance_method=None, data_split_shuffle=True, folds_shuffle=False, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", - "['experiment_name=juice1, log_plots=False, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", - "['2020-07-31 01', '40', '51,526', 'INFO', 'Checking environment']\n", - "['2020-07-31 01', '40', '51,526', 'INFO', 'python_version', '3.7.4']\n", - "['2020-07-31 01', '40', '51,527', 'INFO', 'python_build', \"('default', 'Aug 9 2019 18\", '34', \"13')\"]\n", - "['2020-07-31 01', '40', '51,527', 'INFO', 'machine', 'AMD64']\n", - "['2020-07-31 01', '40', '51,527', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Memory', 'svmem(total=17032478720, available=12121403392, percent=28.8, used=4911075328, free=12121403392)']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Physical Core', '4']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Logical Core', '8']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'Checking libraries']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'pd==1.0.5']\n", - "['2020-07-31 01', '40', '51,599', 'INFO', 'numpy==1.18.5']\n", - "['2020-07-31 01', '40', '55,335', 'INFO', 'sklearn==0.23.1']\n", - "['2020-07-31 01', '40', '55,728', 'INFO', 'xgboost==0.90']\n", - "['2020-07-31 01', '40', '56,084', 'INFO', 'lightgbm==2.3.1']\n", - "['2020-07-31 01', '40', '56,736', 'INFO', 'catboost==0.20.2']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'mlflow==1.8.0']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'Checking Exceptions']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '41', '00,681', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '41', '00,697', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '41', '10,136', 'INFO', 'Copying data for preprocessing']\n", - "['2020-07-31 01', '41', '10,136', 'INFO', 'Declaring global variables']\n", - "['2020-07-31 01', '41', '10,162', 'INFO', 'Declaring preprocessing parameters']\n", - "['2020-07-31 01', '41', '10,162', 'INFO', 'Importing preprocessing module']\n", - "['2020-07-31 01', '41', '14,303', 'INFO', 'Creating preprocessing pipeline']\n", - "['2020-07-31 01', '41', '16,174', 'INFO', 'Preprocessing pipeline created successfully']\n", - "['2020-07-31 01', '41', '16,174', 'INFO', 'Creating grid variables']\n", - "['2020-07-31 01', '41', '16,174', 'INFO', 'Creating global containers']\n", - "['2020-07-31 01', '41', '16,270', 'INFO', 'Logging experiment in MLFlow']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", - "['2020-07-31 01', '41', '16,394', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False)]']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '16,409', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'create_model_container 0']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'master_model_container 0']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'display_container 0']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['verbose=False)']\n", - "['2020-07-31 01', '41', '16,487', 'INFO', 'setup() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '23,818', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 01', '41', '23,818', 'INFO', 'compare_models(blacklist=None, whitelist=None, fold=10, round=4, sort=Accuracy, n_select=1, turbo=True, verbose=True)']\n", - "['2020-07-31 01', '41', '23,818', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '41', '23,820', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '41', '23,820', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '41', '23,838', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '41', '23,839', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '41', '23,910', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 01', '41', '23,922', 'INFO', 'Import successful']\n", - "['2020-07-31 01', '41', '23,928', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '41', '23,928', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '41', '23,928', 'INFO', 'Initializing Logistic Regression']\n", - "['2020-07-31 01', '41', '23,934', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '23,940', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '23,996', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,003', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,007', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '24,013', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,057', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,064', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,068', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '24,073', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,111', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,118', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,122', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '24,127', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,168', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,174', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,178', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '24,182', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,224', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,230', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,235', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '24,240', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,279', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,286', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,290', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '24,296', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,338', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,345', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,349', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '24,354', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,391', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,398', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,402', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '24,407', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,447', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,453', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,457', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '24,462', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,503', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,514', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '24,514', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '24,523', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'save_model(model=LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '24,580', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '24,644', 'INFO', 'Initializing K Neighbors Classifier']\n", - "['2020-07-31 01', '41', '24,647', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '24,647', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,685', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '24,905', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '24,911', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '24,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '24,922', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,165', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,173', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '25,180', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,185', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,410', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,415', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '25,422', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,427', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,652', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,652', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '25,672', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,676', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '25,941', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '25,956', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '25,956', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '25,972', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,219', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '26,235', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '26,235', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '26,249', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,490', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '26,490', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '26,510', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '26,514', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '26,744', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '26,750', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '26,756', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '26,760', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '26,998', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,007', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '27,013', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,019', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,243', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,248', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '27,249', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '27,259', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '27,319', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '27,319', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '27,320', 'INFO', \"save_model(model=KNeighborsClassifier(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '41', '27,320', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '27,330', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '27,338', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), KNeighborsClassifier(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform')]\"]\n", - "['2020-07-31 01', '41', '27,338', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '27,338', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '27,380', 'INFO', 'Initializing Naive Bayes']\n", - "['2020-07-31 01', '41', '27,380', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '27,396', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,398', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,405', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,410', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '27,415', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,418', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,424', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,429', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '27,434', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,437', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,444', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,449', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '27,455', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,458', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,465', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,469', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '27,475', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,478', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,484', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,489', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '27,494', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,497', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,504', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,509', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '27,514', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,517', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,525', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,530', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '27,535', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,538', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,545', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,550', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '27,556', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,559', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,566', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,570', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '27,576', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,579', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,585', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,590', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '27,590', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '27,600', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'save_model(model=GaussianNB(priors=None, var_smoothing=1e-09), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), GaussianNB(priors=None, var_smoothing=1e-09)]']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '27,648', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '27,707', 'INFO', 'Initializing Decision Tree Classifier']\n", - "['2020-07-31 01', '41', '27,712', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '27,718', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,766', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,773', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,778', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '27,783', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,788', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,794', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,799', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '27,806', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,811', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,817', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,825', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '27,834', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,847', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,853', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '27,860', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,866', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,873', 'INFO', 'Compiling Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '27,879', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '27,886', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,891', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,899', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,904', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '27,912', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,917', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,926', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,931', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '27,938', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,944', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,951', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,957', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '27,962', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,967', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '27,976', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '27,982', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '27,987', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '27,993', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,000', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,006', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '28,006', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '28,017', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '28,076', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '28,076', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '28,077', 'INFO', \"save_model(model=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '41', '28,077', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '28,082', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '28,086', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')]\"]\n", - "['2020-07-31 01', '41', '28,087', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '28,087', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '28,135', 'INFO', 'Initializing SVM - Linear Kernel']\n", - "['2020-07-31 01', '41', '28,141', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '28,147', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,188', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,188', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,191', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,193', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,198', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '28,204', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,212', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,212', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,215', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,217', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,222', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '28,227', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,235', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,235', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,238', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,240', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,245', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '28,250', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,256', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,256', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,259', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,262', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,266', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '28,272', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,276', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,276', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,279', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,281', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,286', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '28,291', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,297', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,297', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,300', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,302', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,307', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '28,312', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,319', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,319', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,322', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,324', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,329', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '28,334', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,341', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,341', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,344', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,346', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,350', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '28,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,364', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,364', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,367', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,369', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,374', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '28,378', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,386', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '28,386', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,389', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,391', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,396', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '28,396', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '28,407', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '28,473', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '28,474', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '28,474', 'INFO', 'save_model(model=SGDClassifier(alpha=0.0001, average=False, class_weight=None,']\n", - "['early_stopping=False, epsilon=0.1, eta0=0.0, fit_intercept=True,']\n", - "[\"l1_ratio=0.15, learning_rate='optimal', loss='hinge',\"]\n", - "[\"max_iter=1000, n_iter_no_change=5, n_jobs=-1, penalty='l2',\"]\n", - "['power_t=0.5, random_state=123, shuffle=True, tol=0.001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '28,474', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '28,479', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '28,483', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), SGDClassifier(alpha=0.0001, average=False, class_weight=None,']\n", - "['early_stopping=False, epsilon=0.1, eta0=0.0, fit_intercept=True,']\n", - "[\"l1_ratio=0.15, learning_rate='optimal', loss='hinge',\"]\n", - "[\"max_iter=1000, n_iter_no_change=5, n_jobs=-1, penalty='l2',\"]\n", - "['power_t=0.5, random_state=123, shuffle=True, tol=0.001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False)]']\n", - "['2020-07-31 01', '41', '28,483', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '28,483', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '28,532', 'INFO', 'Initializing Ridge Classifier']\n", - "['2020-07-31 01', '41', '28,532', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '28,547', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,630', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,630', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,646', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,646', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,646', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '28,646', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,662', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,662', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,665', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,667', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,676', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '28,683', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,687', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,687', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,690', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,692', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,697', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '28,706', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,711', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,711', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,713', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,715', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,720', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '28,726', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,730', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,730', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,733', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,735', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,739', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '28,744', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,748', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,749', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,751', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,754', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,759', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '28,764', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,768', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,768', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,771', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,773', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,778', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '28,784', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,788', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,788', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,791', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,793', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,799', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '28,804', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,809', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,809', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,813', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,816', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,821', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '28,827', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '28,831', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '28,831', 'WARNING', 'model has no predict_proba attribute. pred_prob set to 0.00']\n", - "['2020-07-31 01', '41', '28,834', 'WARNING', 'model has no predict_proba attribute. AUC set to 0.00']\n", - "['2020-07-31 01', '41', '28,836', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '28,841', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '28,841', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '28,853', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '28,934', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '28,935', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '28,935', 'INFO', 'save_model(model=RidgeClassifier(alpha=1.0, class_weight=None, copy_X=True, fit_intercept=True,']\n", - "[\"max_iter=None, normalize=False, random_state=123, solver='auto',\"]\n", - "['tol=0.001), model_name=Trained Model, verbose=False)']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '28,935', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '28,940', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '28,944', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RidgeClassifier(alpha=1.0, class_weight=None, copy_X=True, fit_intercept=True,']\n", - "[\"max_iter=None, normalize=False, random_state=123, solver='auto',\"]\n", - "['tol=0.001)]']\n", - "['2020-07-31 01', '41', '28,944', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '28,944', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '28,994', 'INFO', 'Initializing Random Forest Classifier']\n", - "['2020-07-31 01', '41', '29,000', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '29,006', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '29,127', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '29,363', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '29,378', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '29,378', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '29,496', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '29,712', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '29,716', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '29,723', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '29,834', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '30,077', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '30,087', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '30,095', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '30,207', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '30,439', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '30,448', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '30,455', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '30,569', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '30,799', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '30,799', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '30,814', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '30,933', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '31,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '31,175', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '31,183', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '31,295', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '31,538', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '31,547', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '31,553', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '31,666', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '31,902', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '31,913', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '31,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,034', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,263', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,263', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '32,263', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,387', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,626', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,630', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '32,630', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '32,642', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '32,713', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '32,729', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '32,729', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '32,729', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '32,760', 'INFO', 'Initializing Quadratic Discriminant Analysis']\n", - "['2020-07-31 01', '41', '32,776', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '32,776', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,838', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,838', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,854', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '32,854', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,854', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,870', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,870', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '32,870', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,885', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,885', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,885', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '32,901', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,901', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,901', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,916', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '32,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,916', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,932', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,932', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '32,932', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,948', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '32,948', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,948', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '32,963', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,963', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,963', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,979', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '32,979', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '32,979', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '32,995', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '32,995', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '33,010', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,010', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,023', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,029', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '33,033', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,039', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,045', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,050', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '33,050', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '33,062', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'save_model(model=QuadraticDiscriminantAnalysis(priors=None, reg_param=0.0,']\n", - "['store_covariance=False, tol=0.0001), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), QuadraticDiscriminantAnalysis(priors=None, reg_param=0.0,']\n", - "['store_covariance=False, tol=0.0001)]']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '33,114', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '33,161', 'INFO', 'Initializing Ada Boost Classifier']\n", - "['2020-07-31 01', '41', '33,161', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '33,177', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,239', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,255', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,255', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '33,270', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,333', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,348', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,348', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '33,364', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,427', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,442', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,442', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '33,458', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,520', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,536', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,552', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '33,552', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,614', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,649', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,655', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '33,660', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,730', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,746', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,761', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '33,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,839', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,855', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,855', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '33,871', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '33,933', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '33,949', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '33,964', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '33,964', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,027', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,058', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,058', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '34,058', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,136', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,152', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,152', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '34,152', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '34,171', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '34,240', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '34,241', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '34,241', 'INFO', \"save_model(model=AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '34,241', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123)]']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '34,250', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '34,314', 'INFO', 'Initializing Gradient Boosting Classifier']\n", - "['2020-07-31 01', '41', '34,322', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '34,328', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,447', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,455', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,460', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '34,466', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,582', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '34,589', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,594', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '34,600', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,726', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,733', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,739', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '34,745', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,851', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '34,868', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '34,872', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '34,877', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '34,995', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,002', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,008', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '35,013', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,134', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,142', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,146', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '35,151', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,277', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,284', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,290', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '35,296', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,398', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,398', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,413', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '35,413', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,532', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,539', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,545', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '35,550', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,674', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,680', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,686', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '35,686', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '35,699', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', \"save_model(model=GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '35,767', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '35,814', 'INFO', 'Initializing Linear Discriminant Analysis']\n", - "['2020-07-31 01', '41', '35,832', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '35,838', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,848', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,855', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,860', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '35,865', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,873', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,880', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,885', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '35,890', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,900', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,906', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,911', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '35,916', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,924', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,931', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,936', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '35,941', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,949', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,956', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,960', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '35,966', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,973', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '35,980', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '35,985', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '35,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '35,999', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,005', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,013', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '36,021', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,031', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,037', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,043', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '36,048', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,055', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,062', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,066', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '36,071', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,079', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,086', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,091', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '36,091', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '36,103', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '36,160', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '36,160', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '36,161', 'INFO', 'save_model(model=LinearDiscriminantAnalysis(n_components=None, priors=None, shrinkage=None,']\n", - "[\"solver='svd', store_covariance=False, tol=0.0001), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '41', '36,161', 'INFO', 'Appending prep pipeline']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '36,165', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '36,168', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LinearDiscriminantAnalysis(n_components=None, priors=None, shrinkage=None,']\n", - "[\"solver='svd', store_covariance=False, tol=0.0001)]\"]\n", - "['2020-07-31 01', '41', '36,168', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '36,168', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '36,199', 'INFO', 'Initializing Extra Trees Classifier']\n", - "['2020-07-31 01', '41', '36,215', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '36,221', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,359', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,592', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,602', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '36,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '36,759', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '36,976', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '36,983', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '36,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '37,131', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '37,369', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '37,369', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '37,390', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '37,529', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '37,769', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '37,769', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '37,792', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '37,934', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '38,165', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '38,181', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '38,181', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '38,333', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '38,572', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '38,572', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '38,588', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '38,732', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '38,984', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '38,994', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '39,003', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '39,164', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '39,413', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '39,419', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '39,419', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '39,586', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '39,808', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '39,808', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '39,823', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '39,966', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,196', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,196', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '40,196', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '40,211', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'save_model(model=ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '40,302', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '40,333', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '40,349', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '41', '40,349', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '40,349', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '40,395', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 01', '41', '40,395', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '40,410', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,501', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,517', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,532', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '40,537', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,568', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,584', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,603', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '40,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,655', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,667', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,678', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '40,687', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,727', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,740', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,751', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '40,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,800', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,813', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,820', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '40,834', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,873', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,886', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,897', 'INFO', 'Initializing Fold 7']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '41', '40,906', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '40,946', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '40,959', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '40,970', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '40,980', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,020', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,032', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,043', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '41,054', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,096', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,109', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,119', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '41,128', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,175', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,188', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,199', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '41,199', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '41,228', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '41,348', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '41,349', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '41,349', 'INFO', \"save_model(model=XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '41,349', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '41,358', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '41,362', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)]']\n", - "['2020-07-31 01', '41', '41,362', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '41,362', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '41,423', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 01', '41', '41,429', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '41,434', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,515', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,533', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,544', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '41,554', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,628', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,645', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,656', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '41,665', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,734', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,737', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,753', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '41,769', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,837', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,838', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,853', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '41,873', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '41,936', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '41,937', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '41,953', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '41,972', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,047', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,063', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,074', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '42,084', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,180', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,196', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,208', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '42,218', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,287', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,302', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,318', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '42,318', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,380', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,412', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,412', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '42,427', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '42,502', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '42,519', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '42,530', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '41', '42,531', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '41', '42,561', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '41', '42,651', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '41', '42,651', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '41', '42,652', 'INFO', \"save_model(model=LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '41', '42,652', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '41', '42,663', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '41', '42,675', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)]']\n", - "['2020-07-31 01', '41', '42,675', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '41', '42,675', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '41', '42,777', 'INFO', 'Initializing CatBoost Classifier']\n", - "['2020-07-31 01', '41', '42,783', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '41', '42,789', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '45,155', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '45,194', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '45,199', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '41', '45,205', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '47,070', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '47,086', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '47,086', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '41', '47,086', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '48,735', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '48,751', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '48,751', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '41', '48,764', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '50,511', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '50,526', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '50,542', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '41', '50,542', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '52,170', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '52,170', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '52,186', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '41', '52,193', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '53,805', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '53,820', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '53,820', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '41', '53,834', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '55,391', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '55,391', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '55,407', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '41', '55,407', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '56,979', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '56,994', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '56,994', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '41', '57,008', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '41', '58,639', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '41', '58,654', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '41', '58,670', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '41', '58,670', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,228', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,244', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,244', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '00,244', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '00,260', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '00,317', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '00,317', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '00,318', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '00,318', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '00,325', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '00,329', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ]']\n", - "['2020-07-31 01', '42', '00,329', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '00,329', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '00,375', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 01', '42', '00,375', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'create_model(estimator=lr, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '00,383', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '00,391', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '00,392', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '00,392', 'INFO', 'Logistic Regression Imported succesfully']\n", - "['2020-07-31 01', '42', '00,392', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '00,395', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '00,396', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,435', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,441', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,445', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '00,445', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,476', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,476', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,492', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '00,492', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,523', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,539', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,539', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '00,539', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,585', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,585', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,601', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '00,601', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,632', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,648', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,648', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '00,648', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,679', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,695', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,695', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '00,695', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '00,742', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Compiling Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '00,788', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '00,788', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '00,835', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '00,882', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '00,882', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '00,898', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '00,898', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '00,898', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'display_container', '1']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '00,929', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 01', '42', '00,999', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 01', '42', '00,999', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 01', '42', '01,000', 'INFO', 'display_container', '2']\n", - "['2020-07-31 01', '42', '01,000', 'INFO', 'LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '01,000', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'create_model(estimator=lr, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '01,009', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '01,010', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '01,033', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '01,034', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '01,035', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '01,035', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '01,039', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '01,039', 'INFO', 'Logistic Regression Imported succesfully']\n", - "['2020-07-31 01', '42', '01,040', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '01,046', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '01,050', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,094', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,101', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,113', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '01,118', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,160', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,166', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,180', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '01,185', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,230', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,236', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,248', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '01,253', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,295', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,301', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,314', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '01,322', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,368', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,374', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,378', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '01,378', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,432', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,438', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,444', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '01,444', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,497', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,503', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,511', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '01,511', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,561', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,568', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,582', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '01,587', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,626', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,633', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,646', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '01,651', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '01,694', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '01,700', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '01,715', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '01,716', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '01,724', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '01,766', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '01,930', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '01,931', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '01,931', 'INFO', 'save_model(model=LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '01,931', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '01,936', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '01,940', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '01,940', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '01,940', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '01,960', 'INFO', 'Uploading results into container']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '01,960', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '01,993', 'INFO', 'create_model_container', '2']\n", - "['2020-07-31 01', '42', '01,993', 'INFO', 'master_model_container', '2']\n", - "['2020-07-31 01', '42', '01,993', 'INFO', 'display_container', '3']\n", - "['2020-07-31 01', '42', '01,994', 'INFO', 'LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '01,994', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '02,000', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '02,000', 'INFO', 'create_model(estimator=dt, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '02,001', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '02,001', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '02,001', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '02,022', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '02,023', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '02,023', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '02,023', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '02,027', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '02,027', 'INFO', 'Decision Tree Classifier Imported succesfully']\n", - "['2020-07-31 01', '42', '02,028', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '02,035', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '02,040', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,046', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,054', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,069', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '02,073', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,078', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,085', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,099', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '02,104', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,108', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,115', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,133', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '02,137', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,143', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,149', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,165', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '02,170', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,174', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,181', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,198', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '02,204', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,208', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,216', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,234', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '02,239', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,244', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,252', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,268', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '02,273', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,279', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,290', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,307', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '02,313', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,318', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,326', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,342', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '02,347', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,352', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '02,360', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '02,376', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '02,377', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '02,385', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '02,390', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '02,521', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '02,521', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '02,521', 'INFO', \"save_model(model=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '42', '02,521', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '02,526', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '02,530', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')]\"]\n", - "['2020-07-31 01', '42', '02,530', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '02,530', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '02,545', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '02,545', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '02,583', 'INFO', 'create_model_container', '3']\n", - "['2020-07-31 01', '42', '02,583', 'INFO', 'master_model_container', '3']\n", - "['2020-07-31 01', '42', '02,583', 'INFO', 'display_container', '4']\n", - "['2020-07-31 01', '42', '02,584', 'INFO', \"DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')\"]\n", - "['2020-07-31 01', '42', '02,584', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '02,591', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '02,591', 'INFO', 'create_model(estimator=rf, ensemble=False, method=None, fold=5, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '02,591', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '02,592', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '02,592', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '02,613', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '02,614', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '02,615', 'INFO', 'Defining folds']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '02,615', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '02,619', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '02,620', 'INFO', 'Random Forest Classifier Imported succesfully']\n", - "['2020-07-31 01', '42', '02,620', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '02,626', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '02,631', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '02,758', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '03,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '03,028', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '03,034', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '03,159', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '03,378', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '03,408', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '03,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '03,526', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '03,754', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '03,773', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '03,778', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '03,894', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '04,129', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '04,146', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '04,146', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '04,276', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '04,495', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '04,517', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '04,518', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '04,524', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '04,642', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '05,033', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '05,049', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '05,065', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '05,065', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'create_model_container', '4']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'master_model_container', '4']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'display_container', '5']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '05,080', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '05,131', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 01', '42', '05,131', 'INFO', \"compare_models(blacklist=None, whitelist=['rf', 'ada', 'gbc', 'et', 'xgboost', 'lightgbm', 'catboost'], fold=3, round=4, sort=Accuracy, n_select=1, turbo=True, verbose=True)\"]\n", - "['2020-07-31 01', '42', '05,131', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '05,132', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '05,132', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '05,155', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '05,156', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '05,160', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 01', '42', '05,160', 'INFO', 'Import successful']\n", - "['2020-07-31 01', '42', '05,167', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '05,167', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '05,167', 'INFO', 'Initializing Random Forest Classifier']\n", - "['2020-07-31 01', '42', '05,172', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '05,179', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '05,293', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '05,535', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '05,535', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '05,550', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '05,676', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '05,894', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '05,894', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '05,910', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,026', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,258', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,258', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '06,258', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '06,273', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '06,339', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '06,339', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '06,340', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '06,340', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '06,346', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '06,400', 'INFO', 'Initializing Ada Boost Classifier']\n", - "['2020-07-31 01', '42', '06,405', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '06,411', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,478', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,496', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,496', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '06,496', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,575', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,581', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,596', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '06,596', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,670', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,680', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,680', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '06,680', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '06,696', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', \"save_model(model=AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '06,760', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostClassifier(algorithm='SAMME.R', base_estimator=None, learning_rate=1.0,\"]\n", - "['n_estimators=50, random_state=123)]']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '06,779', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '06,825', 'INFO', 'Initializing Gradient Boosting Classifier']\n", - "['2020-07-31 01', '42', '06,825', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '06,841', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '06,929', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '06,929', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '06,944', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '06,944', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,030', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '07,046', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '07,046', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '07,046', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,146', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '07,146', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '07,162', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '07,162', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '07,162', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '07,241', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '07,241', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '07,242', 'INFO', \"save_model(model=GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '07,242', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '07,249', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '07,254', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingClassifier(ccp_alpha=0.0, criterion='friedman_mse', init=None,\"]\n", - "[\"learning_rate=0.1, loss='deviance', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '07,254', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '07,254', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '07,294', 'INFO', 'Initializing Extra Trees Classifier']\n", - "['2020-07-31 01', '42', '07,294', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '07,313', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,459', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '07,694', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '07,694', 'INFO', 'Initializing Fold 2']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '07,694', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '07,859', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,109', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,109', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '08,109', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,277', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,495', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,495', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '08,495', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '08,511', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'save_model(model=ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '08,611', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ExtraTreesClassifier(bootstrap=False, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '08,658', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '08,705', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 01', '42', '08,721', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '08,727', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,759', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,773', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,781', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '08,794', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,828', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,842', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,853', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '08,864', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '08,900', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '08,913', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '08,924', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '08,925', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '08,947', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', \"save_model(model=XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '09,139', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)]']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '09,154', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '09,201', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 01', '42', '09,216', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '09,222', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '09,276', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '09,282', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '09,297', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '09,314', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '09,375', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '09,381', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '09,397', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '09,413', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '09,466', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '09,481', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '09,481', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '09,481', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '09,514', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', \"save_model(model=LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '09,597', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '09,613', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '09,628', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMClassifier(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)]']\n", - "['2020-07-31 01', '42', '09,628', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '09,628', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '09,722', 'INFO', 'Initializing CatBoost Classifier']\n", - "['2020-07-31 01', '42', '09,733', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '09,738', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '11,485', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '11,485', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '11,501', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '11,508', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '13,655', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '13,671', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '13,671', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '13,686', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '15,832', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '15,844', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '15,851', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '15,851', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '15,867', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '15,935', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '15,936', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '15,936', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '15,936', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '15,944', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '15,950', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ]']\n", - "['2020-07-31 01', '42', '15,950', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '15,950', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '16,009', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 01', '42', '16,009', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'create_model(estimator=xgboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '16,014', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '16,024', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '16,024', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '16,025', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '16,026', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '16,026', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '16,026', 'INFO', 'Extreme Gradient Boosting Imported succesfully']\n", - "['2020-07-31 01', '42', '16,027', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '16,030', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '16,031', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,079', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,084', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,099', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '16,099', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,146', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,177', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '16,177', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,224', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,240', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,256', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '16,271', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,318', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,334', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,349', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '16,349', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,396', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,412', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,427', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '16,427', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,474', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,490', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,505', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '16,521', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,568', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,584', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,599', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '16,599', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,646', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,662', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,677', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '16,693', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,740', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,755', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '16,771', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '16,771', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '16,834', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '16,849', 'INFO', 'Compiling Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '16,865', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '16,865', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '16,880', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'create_model_container', '5']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'master_model_container', '5']\n", - "['2020-07-31 01', '42', '16,927', 'INFO', 'display_container', '6']\n", - "['2020-07-31 01', '42', '16,943', 'INFO', \"XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 01', '42', '16,943', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '16,943', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'create_model_container', '5']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'master_model_container', '5']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'display_container', '7']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', \"XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "['learning_rate=0.1, max_delta_step=0, max_depth=3,']\n", - "['min_child_weight=1, missing=None, n_estimators=100, n_jobs=-1,']\n", - "[\"nthread=None, objective='binary\", \"logistic', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 01', '42', '17,034', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '17,048', 'INFO', 'Initializing tune_model()']\n", - "['2020-07-31 01', '42', '17,049', 'INFO', 'tune_model(estimator=LogisticRegression(C=1.0, class_weight=None, dual=False, fit_intercept=True,']\n", - "['intercept_scaling=1, l1_ratio=None, max_iter=100,']\n", - "[\"multi_class='auto', n_jobs=None, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), fold=10, round=4, n_iter=10, custom_grid=None, optimize=Accuracy, choose_better=False, verbose=True)']\n", - "['2020-07-31 01', '42', '17,049', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '17,051', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '17,051', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '17,077', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '17,078', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '17,078', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '17,079', 'INFO', 'Base model', 'Logistic Regression']\n", - "['2020-07-31 01', '42', '17,080', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '17,080', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '17,088', 'INFO', 'Defining Hyperparameters']\n", - "['2020-07-31 01', '42', '17,088', 'INFO', 'Initializing RandomizedSearchCV']\n", - "['2020-07-31 01', '42', '20,205', 'INFO', 'Random search completed']\n", - "['2020-07-31 01', '42', '20,213', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '20,220', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,253', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,261', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,282', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '20,289', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,320', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,328', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,347', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '20,354', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,386', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,394', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,414', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '20,420', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,451', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,460', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,478', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '20,484', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,516', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,525', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,543', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '20,549', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,579', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,589', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,609', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '20,615', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,651', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,661', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,683', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '20,689', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,723', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,732', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,756', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '20,762', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,796', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,805', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,825', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '20,832', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '20,863', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '20,872', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '20,894', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '20,895', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '20,904', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '20,934', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '20,934', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '20,935', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '21,014', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '21,015', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '21,015', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '21,015', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '21,018', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'create_model_container', '6']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'master_model_container', '6']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'display_container', '8']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '21,237', 'INFO', 'tune_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '21,242', 'INFO', 'Initializing tune_model()']\n", - "['2020-07-31 01', '42', '21,243', 'INFO', 'tune_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), fold=10, round=4, n_iter=10, custom_grid=None, optimize=Accuracy, choose_better=False, verbose=True)']\n", - "['2020-07-31 01', '42', '21,243', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '21,244', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '21,244', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '21,264', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '21,265', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '21,265', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '21,266', 'INFO', 'Base model', 'Random Forest Classifier']\n", - "['2020-07-31 01', '42', '21,266', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '21,266', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '21,272', 'INFO', 'Defining Hyperparameters']\n", - "['2020-07-31 01', '42', '21,272', 'INFO', 'Initializing RandomizedSearchCV']\n", - "['2020-07-31 01', '42', '22,790', 'INFO', 'Random search completed']\n", - "['2020-07-31 01', '42', '22,816', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '22,831', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '22,955', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '23,185', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '23,211', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '23,217', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '23,340', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '23,563', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '23,582', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '23,586', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '23,716', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '23,951', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '23,968', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '23,974', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '24,091', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '24,320', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '24,351', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '24,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '24,483', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '24,718', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '24,742', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '24,747', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '24,866', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '25,117', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '25,141', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '25,146', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '25,283', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '25,518', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '25,542', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '25,547', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '25,666', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '25,919', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '25,938', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '25,938', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '26,084', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '26,312', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '26,334', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '26,338', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '26,457', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '26,677', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '26,699', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '26,700', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '26,707', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '26,829', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '26,830', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '26,830', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '26,911', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '26,911', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '26,912', 'INFO', 'save_model(model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '26,912', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '26,927', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '26,931', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '26,931', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '26,931', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '27,309', 'INFO', 'create_model_container', '7']\n", - "['2020-07-31 01', '42', '27,309', 'INFO', 'master_model_container', '7']\n", - "['2020-07-31 01', '42', '27,309', 'INFO', 'display_container', '9']\n", - "['2020-07-31 01', '42', '27,310', 'INFO', 'RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '27,310', 'INFO', 'tune_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '27,315', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 01', '42', '27,316', 'INFO', \"ensemble_model(estimator=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Bagging, fold=10, n_estimators=10, round=4, choose_better=False, optimize=Accuracy, verbose=True)\"]\n", - "['2020-07-31 01', '42', '27,316', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '27,316', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '27,316', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '27,335', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '27,335', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '27,336', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '27,337', 'INFO', 'Base model', 'Decision Tree Classifier']\n", - "['2020-07-31 01', '42', '27,341', 'INFO', 'Importing untrained ensembler']\n", - "['2020-07-31 01', '42', '27,342', 'INFO', 'BaggingClassifier() succesfully imported']\n", - "['2020-07-31 01', '42', '27,347', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '27,347', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '27,349', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '27,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,384', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,416', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,430', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '27,435', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,459', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,487', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,504', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '27,509', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,534', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,567', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,582', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '27,587', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,612', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,644', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,658', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '27,663', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,686', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,718', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,733', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '27,738', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,764', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,799', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,816', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '27,822', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,852', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,892', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,904', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '27,904', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '27,938', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '27,970', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '27,985', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '27,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,015', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,047', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,062', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '28,067', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,121', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,139', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '28,140', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '28,150', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '28,173', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '28,173', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '28,174', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '28,239', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '28,239', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '28,240', 'INFO', 'save_model(model=BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '28,240', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '28,250', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '28,256', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)]']\n", - "['2020-07-31 01', '42', '28,256', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '28,256', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '28,419', 'INFO', 'create_model_container', '8']\n", - "['2020-07-31 01', '42', '28,420', 'INFO', 'master_model_container', '8']\n", - "['2020-07-31 01', '42', '28,420', 'INFO', 'display_container', '10']\n", - "['2020-07-31 01', '42', '28,421', 'INFO', 'BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)']\n", - "['2020-07-31 01', '42', '28,421', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '28,427', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 01', '42', '28,428', 'INFO', \"ensemble_model(estimator=DecisionTreeClassifier(ccp_alpha=0.0, class_weight=None, criterion='gini',\"]\n", - "['max_depth=None, max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Boosting, fold=10, n_estimators=10, round=4, choose_better=False, optimize=Accuracy, verbose=True)\"]\n", - "['2020-07-31 01', '42', '28,428', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '28,428', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '28,429', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '28,447', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '28,447', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '28,449', 'INFO', 'Checking base model']\n", - "['2020-07-31 01', '42', '28,452', 'INFO', 'Base model', 'Decision Tree Classifier']\n", - "['2020-07-31 01', '42', '28,456', 'INFO', 'Importing untrained ensembler']\n", - "['2020-07-31 01', '42', '28,457', 'INFO', 'AdaBoostClassifier() succesfully imported']\n", - "['2020-07-31 01', '42', '28,463', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '28,463', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '28,464', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '28,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,508', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,517', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,531', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '28,536', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,568', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,577', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,591', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '28,597', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,634', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,644', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,659', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '28,665', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,708', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,718', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,735', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '28,741', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,778', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,789', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,809', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '28,817', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,858', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,868', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,885', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '28,891', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '28,920', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '28,933', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '28,953', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '28,960', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,003', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '29,013', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '29,028', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '29,033', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,071', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '29,082', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '29,099', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '29,103', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,134', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '29,144', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '29,161', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '29,162', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '29,174', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '29,219', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '29,219', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '29,220', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '29,282', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '29,282', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '29,283', 'INFO', \"save_model(model=AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '29,283', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '29,297', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '29,304', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123)]']\n", - "['2020-07-31 01', '42', '29,304', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '29,304', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '29,449', 'INFO', 'create_model_container', '9']\n", - "['2020-07-31 01', '42', '29,449', 'INFO', 'master_model_container', '9']\n", - "['2020-07-31 01', '42', '29,449', 'INFO', 'display_container', '11']\n", - "['2020-07-31 01', '42', '29,450', 'INFO', \"AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123)']\n", - "['2020-07-31 01', '42', '29,450', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '29,456', 'INFO', 'Initializing blend_models()']\n", - "['2020-07-31 01', '42', '29,459', 'INFO', \"blend_models(estimator_list=[AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)], fold=10, round=4, choose_better=False, optimize=Accuracy, method=soft, turbo=True, verbose=True)']\n", - "['2020-07-31 01', '42', '29,459', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '29,461', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '29,461', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '29,481', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '29,481', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '29,482', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '29,482', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '29,486', 'INFO', 'Defining model names in estimator_list']\n", - "['2020-07-31 01', '42', '29,656', 'INFO', 'n_jobs multiple passed']\n", - "['2020-07-31 01', '42', '29,664', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '29,672', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '29,826', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '30,112', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '30,136', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '30,147', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '30,300', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '30,559', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '30,571', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '30,576', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '30,719', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '30,986', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '31,001', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '31,007', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '31,147', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '31,442', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '31,460', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '31,466', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '31,602', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '31,896', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '31,921', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '31,927', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '32,074', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '32,325', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '32,340', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '32,346', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '32,497', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '32,810', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '32,826', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '32,836', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '32,985', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '33,258', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '33,272', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '33,281', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '33,422', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '33,716', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '33,731', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '33,736', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '33,878', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '34,182', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '34,205', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '34,206', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '34,219', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '34,367', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '34,368', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '34,368', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '34,421', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '34,422', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '34,429', 'INFO', \"save_model(model=VotingClassifier(estimators=[('Bagging Classifier_1',\"]\n", - "['BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['r...']\n", - "['max_depth=30,']\n", - "[\"max_features='auto',\"]\n", - "['max_leaf_nodes=None,']\n", - "['max_samples=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False,']\n", - "['random_state=123,']\n", - "['verbose=0,']\n", - "['warm_start=False))],']\n", - "['flatten_transform=True, n_jobs=-1, verbose=False,']\n", - "[\"voting='soft', weights=None), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '42', '34,429', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '34,478', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '34,488', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), VotingClassifier(estimators=[('Bagging Classifier_1',\"]\n", - "['BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['r...']\n", - "['max_depth=30,']\n", - "[\"max_features='auto',\"]\n", - "['max_leaf_nodes=None,']\n", - "['max_samples=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False,']\n", - "['random_state=123,']\n", - "['verbose=0,']\n", - "['warm_start=False))],']\n", - "['flatten_transform=True, n_jobs=-1, verbose=False,']\n", - "[\"voting='soft', weights=None)]\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '34,489', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '34,489', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '34,946', 'INFO', 'create_model_container', '10']\n", - "['2020-07-31 01', '42', '34,947', 'INFO', 'master_model_container', '10']\n", - "['2020-07-31 01', '42', '34,947', 'INFO', 'display_container', '12']\n", - "['2020-07-31 01', '42', '34,953', 'INFO', \"VotingClassifier(estimators=[('Bagging Classifier_1',\"]\n", - "['BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['r...']\n", - "['max_depth=30,']\n", - "[\"max_features='auto',\"]\n", - "['max_leaf_nodes=None,']\n", - "['max_samples=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False,']\n", - "['random_state=123,']\n", - "['verbose=0,']\n", - "['warm_start=False))],']\n", - "['flatten_transform=True, n_jobs=-1, verbose=False,']\n", - "[\"voting='soft', weights=None)\"]\n", - "['2020-07-31 01', '42', '34,954', 'INFO', 'blend_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '34,961', 'INFO', 'Initializing stack_models()']\n", - "['2020-07-31 01', '42', '34,963', 'INFO', \"stack_models(estimator_list=[AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False)], meta_model=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), fold=10, round=4, method=soft, restack=True, plot=False, choose_better=False, optimize=Accuracy, finalize=False, verbose=True)']\n", - "['2020-07-31 01', '42', '34,964', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '34,965', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '34,965', 'INFO', 'Copying estimator list']\n", - "['2020-07-31 01', '42', '34,970', 'INFO', 'Defining meta model']\n", - "['2020-07-31 01', '42', '34,972', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '34,990', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '34,991', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '34,993', 'INFO', 'Getting model names']\n", - "['2020-07-31 01', '42', '34,995', 'INFO', 'Checking base model', 'AdaBoostClassifier']\n", - "['2020-07-31 01', '42', '34,999', 'INFO', 'Fitting base model']\n", - "['2020-07-31 01', '42', '35,039', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 01', '42', '35,373', 'INFO', 'Checking base model', 'BaggingClassifier']\n", - "['2020-07-31 01', '42', '35,378', 'INFO', 'Fitting base model']\n", - "['2020-07-31 01', '42', '35,408', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 01', '42', '35,751', 'INFO', 'Checking base model', 'RandomForestClassifier']\n", - "['2020-07-31 01', '42', '35,751', 'INFO', 'Fitting base model']\n", - "['2020-07-31 01', '42', '35,872', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 01', '42', '37,647', 'INFO', 'Base layer complete']\n", - "['2020-07-31 01', '42', '37,802', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '37,804', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '37,809', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '37,921', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '38,152', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '38,166', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '38,172', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '38,289', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '38,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '38,540', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '38,554', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '38,673', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '38,892', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '38,922', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '38,929', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '39,040', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '39,259', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '39,274', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '39,286', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '39,406', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '39,641', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '39,660', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '39,660', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '39,792', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '40,042', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '40,064', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '40,070', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '40,189', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '40,439', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '40,454', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '40,461', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '40,574', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '40,793', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '40,808', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '40,816', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '40,938', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '41,188', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '41,209', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '41,215', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '41,339', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '41,557', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '41,572', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '41,572', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '41,583', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '41,583', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 01', '42', '41,583', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '41,658', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '41,658', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '41,658', 'INFO', \"save_model(model=[AdaBoostClassifier(algorithm='SAMME.R',\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "[\"warm_start=False), 'soft', True], model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 01', '42', '41,658', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '41,674', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '41,690', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), [AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "[\"warm_start=False), 'soft', True]]\"]\n", - "['2020-07-31 01', '42', '41,690', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '41,690', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '42,222', 'INFO', 'create_model_container', '11']\n", - "['2020-07-31 01', '42', '42,222', 'INFO', 'master_model_container', '11']\n", - "['2020-07-31 01', '42', '42,222', 'INFO', 'display_container', '13']\n", - "['2020-07-31 01', '42', '42,224', 'INFO', \"[AdaBoostClassifier(algorithm='SAMME.R',\"]\n", - "['base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['learning_rate=1.0, n_estimators=10, random_state=123), BaggingClassifier(base_estimator=DecisionTreeClassifier(ccp_alpha=0.0,']\n", - "['class_weight=None,']\n", - "[\"criterion='gini',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=10, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=30, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=10,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=30, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "[\"warm_start=False), 'soft', True]\"]\n", - "['2020-07-31 01', '42', '42,224', 'INFO', 'stack_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '42,230', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '42,231', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=auc, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '42,231', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'Preparing display monitor']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '42,342', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '42,342', 'INFO', 'plot type', 'auc']\n", - "['2020-07-31 01', '42', '42,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '42,413', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '42', '42,806', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '42,806', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '42,819', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '42,820', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=confusion_matrix, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '42,820', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '42,926', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '42,926', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '42,941', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '42,941', 'INFO', 'plot type', 'confusion_matrix']\n", - "['2020-07-31 01', '42', '42,957', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '42,957', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '42', '43,239', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '43,239', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '43,245', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '43,246', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=boundary, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '43,246', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '43,359', 'INFO', 'plot type', 'boundary']\n", - "['2020-07-31 01', '42', '43,491', 'INFO', 'Fitting StandardScaler()']\n", - "['2020-07-31 01', '42', '43,497', 'INFO', 'Fitting PCA()']\n", - "['2020-07-31 01', '42', '43,525', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '44,935', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '44,935', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '44,969', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '42', '44,970', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=parameter, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '44,970', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '45,076', 'INFO', 'plot type', 'parameter']\n", - "['2020-07-31 01', '42', '45,092', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '45,092', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'create_model(estimator=catboost, ensemble=False, method=None, fold=10, round=4, cross_validation=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '45,100', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '45,120', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '45,121', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '45,122', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '45,122', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '45,127', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '45,128', 'INFO', 'CatBoost Classifier Imported succesfully']\n", - "['2020-07-31 01', '42', '45,128', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '45,133', 'INFO', 'Cross validation set to False']\n", - "['2020-07-31 01', '42', '45,134', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'create_model_container 11']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'master_model_container 11']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'display_container 13']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', '']\n", - "['2020-07-31 01', '42', '46,706', 'INFO', 'create_models() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '46,719', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 01', '42', '46,719', 'INFO', 'interpret_model(estimator=, plot=summary, feature=None, observation=None)']\n", - "['2020-07-31 01', '42', '46,719', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'plot type', 'summary']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'model type detected', 'type 2']\n", - "['2020-07-31 01', '42', '47,417', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 01', '42', '47,714', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 01', '42', '48,401', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '48,401', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'interpret_model(estimator=, plot=correlation, feature=None, observation=None)']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'plot type', 'correlation']\n", - "['2020-07-31 01', '42', '48,424', 'WARNING', 'No feature passed. Default value of feature used for correlation plot', 'WeekofPurchase']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'model type detected', 'type 2']\n", - "['2020-07-31 01', '42', '48,424', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 01', '42', '48,742', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 01', '42', '49,226', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '49,226', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '49,245', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 01', '42', '49,245', 'INFO', 'interpret_model(estimator=, plot=reason, feature=None, observation=12)']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'plot type', 'reason']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'model type detected', 'type 2']\n", - "['2020-07-31 01', '42', '49,246', 'INFO', 'Creating TreeExplainer']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '42', '49,564', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 01', '42', '49,970', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '42', '49,970', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,001', 'INFO', 'Initializing automl()']\n", - "['2020-07-31 01', '42', '50,001', 'INFO', 'automl(optimize=Recall, use_holdout=False)']\n", - "['2020-07-31 01', '42', '50,001', 'INFO', 'Model Selection Basis', 'CV Results on Training set']\n", - "['2020-07-31 01', '42', '50,007', 'INFO', 'SubProcess finalize_model() called ==================================']\n", - "['2020-07-31 01', '42', '50,008', 'INFO', 'Initializing finalize_model()']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', \"finalize_model(estimator=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False))']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', 'Getting model name']\n", - "['2020-07-31 01', '42', '50,009', 'INFO', 'Finalizing Logistic Regression']\n", - "['2020-07-31 01', '42', '50,038', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 01', '42', '50,073', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 01', '42', '50,073', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', \"create_model(estimator=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '42', '50,074', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '42', '50,082', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 01', '42', '50,082', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Defining folds']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Importing untrained model']\n", - "['2020-07-31 01', '42', '50,083', 'INFO', 'Declaring custom model']\n", - "['2020-07-31 01', '42', '50,084', 'INFO', 'Logistic Regression Imported succesfully']\n", - "['2020-07-31 01', '42', '50,085', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 01', '42', '50,087', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 01', '42', '50,088', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,114', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,121', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,126', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 01', '42', '50,128', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,152', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,158', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,162', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 01', '42', '50,163', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,181', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,181', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,181', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 01', '42', '50,196', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,212', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,212', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,228', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 01', '42', '50,228', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,243', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,259', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,259', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 01', '42', '50,259', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,275', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,290', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,290', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 01', '42', '50,290', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,306', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,321', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,321', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 01', '42', '50,321', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 01', '42', '50,353', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,389', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,402', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,407', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 01', '42', '50,409', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '42', '50,430', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 01', '42', '50,431', 'INFO', 'Finalizing model']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'Uploading model into container now']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'create_model_container', '12']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'master_model_container', '12']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'display_container', '14']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,462', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,509', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'create_model_container', '12']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'master_model_container', '12']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'display_container', '14']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'finalize_model() succesfully completed......................................']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'SubProcess finalize_model() end ==================================']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '42', '50,556', 'INFO', 'automl() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '01,294', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '45', '01,295', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=best-model, verbose=True)']\n", - "['2020-07-31 01', '45', '01,295', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '45', '01,303', 'INFO', 'best-model.pkl saved in current working directory']\n", - "['2020-07-31 01', '45', '01,308', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '45', '01,309', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '03,776', 'INFO', 'Initializing deploy_model()']\n", - "['2020-07-31 01', '45', '03,776', 'INFO', \"deploy_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "[\"warm_start=False), model_name=best-aws, authentication={'bucket'\", \"'pycaret-test'}, platform=aws)\"]\n", - "['2020-07-31 01', '45', '03,798', 'INFO', 'Platform', 'AWS S3']\n", - "['2020-07-31 01', '45', '03,997', 'INFO', 'Saving model in active working directory']\n", - "['2020-07-31 01', '45', '03,997', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 01', '45', '03,997', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 01', '45', '03,998', 'INFO', \"save_model(model=LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False), model_name=best-aws, verbose=False)']\n", - "['2020-07-31 01', '45', '03,998', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 01', '45', '04,004', 'INFO', 'best-aws.pkl saved in current working directory']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='classification',\"]\n", - "[\"numerical_features=[], target='Purchase',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_L...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='Purchase')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)]']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 01', '45', '04,008', 'INFO', 'Initializing S3 client']\n", - "['2020-07-31 01', '45', '04,989', 'INFO', \"LogisticRegression(C=5.5600000000000005, class_weight='balanced', dual=False,\"]\n", - "['fit_intercept=True, intercept_scaling=1, l1_ratio=None,']\n", - "[\"max_iter=100, multi_class='auto', n_jobs=-1, penalty='l2',\"]\n", - "[\"random_state=123, solver='lbfgs', tol=0.0001, verbose=0,\"]\n", - "['warm_start=False)']\n", - "['2020-07-31 01', '45', '04,989', 'INFO', 'deploy_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'get_config(variable=X_train)']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'Global variable', 'X_train returned']\n", - "['2020-07-31 01', '45', '05,013', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,044', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 01', '45', '05,044', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 01', '45', '05,045', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 01', '45', '05,045', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'Initializing set_config()']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'set_config(variable=seed, value=999)']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'Global variable', 'seed updated']\n", - "['2020-07-31 01', '45', '05,495', 'INFO', 'set_config() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 01', '45', '05,898', 'INFO', 'get_config() succesfully completed......................................']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 01', '45', '23,821', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '45', '23,822', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=FEATURE, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '45', '23,822', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '45', '27,575', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '45', '27,577', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=feature, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '45', '27,577', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '45', '27,691', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '45', '27,691', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '45', '27,691', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '45', '27,691', 'INFO', 'plot type', 'feature']\n", - "['2020-07-31 01', '45', '27,691', 'WARNING', 'No coef_ found. Trying feature_importances_']\n", - "['2020-07-31 01', '45', '27,906', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '45', '27,906', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '31,933', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '45', '31,934', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=pr, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '45', '31,934', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'plot type', 'pr']\n", - "['2020-07-31 01', '45', '32,042', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '45', '32,057', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '45', '32,376', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '45', '32,376', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 01', '45', '42,906', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 01', '45', '42,907', 'INFO', 'plot_model(estimator=RandomForestClassifier(bootstrap=True, ccp_alpha=0.0, class_weight=None,']\n", - "[\"criterion='gini', max_depth=None, max_features='auto',\"]\n", - "['max_leaf_nodes=None, max_samples=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=10, n_jobs=-1,']\n", - "['oob_score=False, random_state=123, verbose=0,']\n", - "['warm_start=False), plot=class_report, save=False, verbose=True, system=True)']\n", - "['2020-07-31 01', '45', '42,907', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 01', '45', '43,013', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 01', '45', '43,013', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 01', '45', '43,013', 'INFO', 'Importing libraries']\n", - "['2020-07-31 01', '45', '43,013', 'INFO', 'plot type', 'class_report']\n", - "['2020-07-31 01', '45', '43,032', 'INFO', 'Fitting Model']\n", - "['2020-07-31 01', '45', '43,033', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 01', '45', '43,362', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 01', '45', '43,362', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '16,732', 'INFO', 'PyCaret Regression Module']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'version 2.0']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'Initializing setup()']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'USI', '5b1c']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'setup(data=(1338, 7), target=charges, train_size=0.7, sampling=True, sample_estimator=None, categorical_features=None, categorical_imputation=constant, ordinal_features=None,']\n", - "['high_cardinality_features=None, high_cardinality_method=frequency, numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=None, normalize=False,']\n", - "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", - "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None, remove_outliers=False, outliers_threshold=0.05,']\n", - "['remove_multicollinearity=False, multicollinearity_threshold=0.9, remove_perfect_collinearity=False, create_clusters=False, cluster_iter=20,']\n", - "['polynomial_features=False, polynomial_degree=2, trigonometry_features=False, polynomial_threshold=0.1, group_features=None,']\n", - "['group_names=None, feature_selection=False, feature_selection_threshold=0.8, feature_interaction=False, feature_ratio=False, interaction_threshold=0.01, transform_target=False,']\n", - "['transform_target_method=box-cox, data_split_shuffle=True, folds_shuffle=False, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", - "['experiment_name=insurance1, log_plots=False, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'Checking environment']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'python_version', '3.7.4']\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'python_build', \"('default', 'Aug 9 2019 18\", '34', \"13')\"]\n", - "['2020-07-31 08', '44', '16,733', 'INFO', 'machine', 'AMD64']\n", - "['2020-07-31 08', '44', '16,734', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'Memory', 'svmem(total=17032478720, available=12508303360, percent=26.6, used=4524175360, free=12508303360)']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'Physical Core', '4']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'Logical Core', '8']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'Checking libraries']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'pd==1.0.5']\n", - "['2020-07-31 08', '44', '16,785', 'INFO', 'numpy==1.18.5']\n", - "['2020-07-31 08', '44', '17,421', 'INFO', 'sklearn==0.23.1']\n", - "['2020-07-31 08', '44', '17,518', 'INFO', 'xgboost==0.90']\n", - "['2020-07-31 08', '44', '17,654', 'INFO', 'lightgbm==2.3.1']\n", - "['2020-07-31 08', '44', '17,720', 'INFO', 'catboost==0.20.2']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'mlflow==1.8.0']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'Checking Exceptions']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '44', '19,702', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '44', '21,667', 'INFO', 'Copying data for preprocessing']\n", - "['2020-07-31 08', '44', '21,667', 'INFO', 'Declaring global variables']\n", - "['2020-07-31 08', '44', '21,672', 'INFO', 'Declaring preprocessing parameters']\n", - "['2020-07-31 08', '44', '21,672', 'INFO', 'Importing preprocessing module']\n", - "['2020-07-31 08', '44', '22,570', 'INFO', 'Creating preprocessing pipeline']\n", - "['2020-07-31 08', '44', '23,523', 'INFO', 'Preprocessing pipeline created successfully']\n", - "['2020-07-31 08', '44', '23,523', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '23,523', 'INFO', 'Creating grid variables']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '44', '23,525', 'INFO', 'Creating global containers']\n", - "['2020-07-31 08', '44', '23,590', 'INFO', 'Logging experiment in MLFlow']\n", - "['2020-07-31 08', '44', '23,723', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '23,724', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '23,728', 'INFO', 'save_model(model=Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), model_name=Transformation Pipeline, verbose=False)']\n", - "['2020-07-31 08', '44', '23,728', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '23,732', 'INFO', 'Transformation Pipeline.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '23,740', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), None]']\n", - "['2020-07-31 08', '44', '23,740', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '23,740', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '23,806', 'INFO', 'create_model_container', '0']\n", - "['2020-07-31 08', '44', '23,806', 'INFO', 'master_model_container', '0']\n", - "['2020-07-31 08', '44', '23,806', 'INFO', 'display_container', '0']\n", - "['2020-07-31 08', '44', '23,806', 'INFO', 'setup() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'compare_models(blacklist=None, whitelist=None, fold=5, round=4, sort=R2, n_select=1, turbo=True, verbose=True)']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '44', '25,731', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '44', '25,754', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '44', '25,756', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '44', '25,767', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 08', '44', '25,768', 'INFO', 'Import successful']\n", - "['2020-07-31 08', '44', '25,774', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '44', '25,774', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '44', '25,774', 'INFO', 'Initializing Linear Regression']\n", - "['2020-07-31 08', '44', '25,782', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '25,788', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,795', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,796', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,797', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,856', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '25,873', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,876', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,877', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,877', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,883', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '25,888', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,892', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,894', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,894', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,900', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '25,905', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,907', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,909', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,909', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,915', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '25,920', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '25,923', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '25,925', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '25,925', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '25,931', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '25,932', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '25,940', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '25,990', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '25,990', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '25,991', 'INFO', 'save_model(model=LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '25,991', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '25,995', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '25,999', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), None]']\n", - "['2020-07-31 08', '44', '25,999', 'INFO', 'save_model() succesfully completed......................................']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '44', '25,999', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,024', 'INFO', 'Initializing Lasso Regression']\n", - "['2020-07-31 08', '44', '26,039', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,051', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,056', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,057', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,058', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,063', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,071', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,074', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,076', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,076', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,082', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,088', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,093', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,093', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,099', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,105', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,108', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,109', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,110', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,115', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '26,121', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,125', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,126', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,126', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,132', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '26,132', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '26,140', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '26,196', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '26,197', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '26,197', 'INFO', 'save_model(model=Lasso(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=1000,']\n", - "['normalize=False, positive=False, precompute=False, random_state=123,']\n", - "[\"selection='cyclic', tol=0.0001, warm_start=False), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '26,197', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '26,201', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '26,205', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Lasso(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=1000,']\n", - "['normalize=False, positive=False, precompute=False, random_state=123,']\n", - "[\"selection='cyclic', tol=0.0001, warm_start=False), None]\"]\n", - "['2020-07-31 08', '44', '26,206', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '26,206', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,250', 'INFO', 'Initializing Ridge Regression']\n", - "['2020-07-31 08', '44', '26,255', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,260', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,265', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,266', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,266', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,272', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,278', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,281', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,283', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,283', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,289', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,294', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,297', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,298', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,298', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,304', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,309', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,312', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,314', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,314', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,320', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '26,325', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,329', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,330', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,330', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,336', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '26,336', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '26,346', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '26,403', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '26,403', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '26,403', 'INFO', 'save_model(model=Ridge(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=None,']\n", - "[\"normalize=False, random_state=123, solver='auto', tol=0.001), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '26,403', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '26,407', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '26,413', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Ridge(alpha=1.0, copy_X=True, fit_intercept=True, max_iter=None,']\n", - "[\"normalize=False, random_state=123, solver='auto', tol=0.001), None]\"]\n", - "['2020-07-31 08', '44', '26,413', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '26,413', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,453', 'INFO', 'Initializing Elastic Net']\n", - "['2020-07-31 08', '44', '26,458', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,463', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,467', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,468', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,468', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,474', 'INFO', 'Initializing Fold 2']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '44', '26,480', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,483', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,485', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,485', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,490', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,496', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,498', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,500', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,500', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,505', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,511', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,514', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,517', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,517', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,523', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '26,528', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,530', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,532', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,532', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,538', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '26,538', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '26,552', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '26,618', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '26,618', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '26,618', 'INFO', 'save_model(model=ElasticNet(alpha=1.0, copy_X=True, fit_intercept=True, l1_ratio=0.5,']\n", - "['max_iter=1000, normalize=False, positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic', tol=0.0001, warm_start=False), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '26,619', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '26,623', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '26,627', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), ElasticNet(alpha=1.0, copy_X=True, fit_intercept=True, l1_ratio=0.5,']\n", - "['max_iter=1000, normalize=False, positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic', tol=0.0001, warm_start=False), None]\"]\n", - "['2020-07-31 08', '44', '26,627', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '26,628', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,667', 'INFO', 'Initializing Least Angle Regression']\n", - "['2020-07-31 08', '44', '26,672', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,678', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,684', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,686', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,686', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,692', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,698', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,703', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,705', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,705', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,710', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,716', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,721', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,723', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,723', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,728', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,735', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,742', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,744', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,744', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,751', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '26,756', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,762', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,764', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,764', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,771', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '26,772', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '26,787', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'save_model(model=Lars(copy_X=True, eps=2.220446049250313e-16, fit_intercept=True, fit_path=True,']\n", - "[\"jitter=None, n_nonzero_coefs=500, normalize=True, precompute='auto',\"]\n", - "['random_state=None, verbose=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '26,842', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '26,857', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), Lars(copy_X=True, eps=2.220446049250313e-16, fit_intercept=True, fit_path=True,']\n", - "[\"jitter=None, n_nonzero_coefs=500, normalize=True, precompute='auto',\"]\n", - "['random_state=None, verbose=False), None]']\n", - "['2020-07-31 08', '44', '26,857', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '26,857', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '26,889', 'INFO', 'Initializing Lasso Least Angle Regression']\n", - "['2020-07-31 08', '44', '26,909', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '26,918', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,923', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,924', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,924', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,932', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '26,937', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,943', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,945', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,945', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,954', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '26,961', 'INFO', 'Fitting Model']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '44', '26,967', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,968', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,969', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,975', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '26,982', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '26,988', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '26,990', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '26,990', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '26,997', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '27,003', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,009', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,012', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,012', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,021', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '27,021', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '27,032', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '27,089', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '27,090', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '27,090', 'INFO', 'save_model(model=LassoLars(alpha=1.0, copy_X=True, eps=2.220446049250313e-16, fit_intercept=True,']\n", - "['fit_path=True, jitter=None, max_iter=500, normalize=True,']\n", - "[\"positive=False, precompute='auto', random_state=None, verbose=False), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '27,090', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '27,095', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '27,100', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), LassoLars(alpha=1.0, copy_X=True, eps=2.220446049250313e-16, fit_intercept=True,']\n", - "['fit_path=True, jitter=None, max_iter=500, normalize=True,']\n", - "[\"positive=False, precompute='auto', random_state=None, verbose=False), None]\"]\n", - "['2020-07-31 08', '44', '27,100', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '27,100', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '27,144', 'INFO', 'Initializing Orthogonal Matching Pursuit']\n", - "['2020-07-31 08', '44', '27,148', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '27,155', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,158', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,160', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,160', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,166', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '27,173', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,177', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,178', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,179', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,186', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '27,194', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,197', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,199', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,199', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,206', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '27,213', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,216', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,218', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,218', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,224', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '27,232', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,236', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,237', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,237', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,244', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '27,245', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '27,262', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '27,325', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '27,325', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '27,326', 'INFO', 'save_model(model=OrthogonalMatchingPursuit(fit_intercept=True, n_nonzero_coefs=None,']\n", - "[\"normalize=True, precompute='auto', tol=None), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '27,326', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '27,331', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '27,335', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), OrthogonalMatchingPursuit(fit_intercept=True, n_nonzero_coefs=None,']\n", - "[\"normalize=True, precompute='auto', tol=None), None]\"]\n", - "['2020-07-31 08', '44', '27,335', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '27,335', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '27,376', 'INFO', 'Initializing Bayesian Ridge']\n", - "['2020-07-31 08', '44', '27,381', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '27,387', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,393', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,395', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,396', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,403', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '27,410', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,415', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,417', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,417', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,423', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '27,429', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,434', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,435', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,436', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,441', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '27,447', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,455', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,457', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,457', 'INFO', 'Compiling Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '44', '27,463', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '27,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,474', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,476', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,476', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,482', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '27,482', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '27,493', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '27,550', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '27,551', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '27,551', 'INFO', 'save_model(model=BayesianRidge(alpha_1=1e-06, alpha_2=1e-06, alpha_init=None,']\n", - "['compute_score=False, copy_X=True, fit_intercept=True,']\n", - "['lambda_1=1e-06, lambda_2=1e-06, lambda_init=None, n_iter=300,']\n", - "['normalize=False, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '27,551', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '27,556', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '27,559', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), BayesianRidge(alpha_1=1e-06, alpha_2=1e-06, alpha_init=None,']\n", - "['compute_score=False, copy_X=True, fit_intercept=True,']\n", - "['lambda_1=1e-06, lambda_2=1e-06, lambda_init=None, n_iter=300,']\n", - "['normalize=False, tol=0.001, verbose=False), None]']\n", - "['2020-07-31 08', '44', '27,559', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '27,559', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '27,590', 'INFO', 'Initializing Passive Aggressive Regressor']\n", - "['2020-07-31 08', '44', '27,606', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '27,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,619', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,620', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,620', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,626', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '27,631', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,638', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,640', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,640', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,645', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '27,651', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,656', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,658', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,658', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,664', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '27,669', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,675', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,677', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,677', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,683', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '27,687', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,694', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,696', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,696', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,701', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '27,702', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '27,712', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '27,773', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '27,773', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '27,774', 'INFO', 'save_model(model=PassiveAggressiveRegressor(C=1.0, average=False, early_stopping=False,']\n", - "['epsilon=0.1, fit_intercept=True,']\n", - "[\"loss='epsilon_insensitive', max_iter=1000,\"]\n", - "['n_iter_no_change=5, random_state=123, shuffle=True,']\n", - "['tol=0.001, validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '27,774', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '27,775', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '27,783', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), PassiveAggressiveRegressor(C=1.0, average=False, early_stopping=False,']\n", - "['epsilon=0.1, fit_intercept=True,']\n", - "[\"loss='epsilon_insensitive', max_iter=1000,\"]\n", - "['n_iter_no_change=5, random_state=123, shuffle=True,']\n", - "['tol=0.001, validation_fraction=0.1, verbose=0,']\n", - "['warm_start=False), None]']\n", - "['2020-07-31 08', '44', '27,783', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '27,783', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '27,826', 'INFO', 'Initializing Random Sample Consensus']\n", - "['2020-07-31 08', '44', '27,831', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '27,836', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '27,923', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '27,924', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '27,924', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '27,930', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '27,935', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '28,015', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '28,017', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '28,017', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '28,022', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '28,027', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '28,105', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '28,106', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '28,106', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '28,112', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '28,116', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '28,195', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '28,197', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '28,197', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '28,202', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '28,208', 'INFO', 'Fitting Model']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '44', '28,298', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '28,300', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '28,300', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '28,306', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '28,306', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '28,322', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'save_model(model=RANSACRegressor(base_estimator=None, is_data_valid=None, is_model_valid=None,']\n", - "[\"loss='absolute_loss', max_skips=inf, max_trials=100,\"]\n", - "['min_samples=0.5, random_state=123, residual_threshold=None,']\n", - "['stop_n_inliers=inf, stop_probability=0.99, stop_score=inf), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '28,377', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '28,396', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), RANSACRegressor(base_estimator=None, is_data_valid=None, is_model_valid=None,']\n", - "[\"loss='absolute_loss', max_skips=inf, max_trials=100,\"]\n", - "['min_samples=0.5, random_state=123, residual_threshold=None,']\n", - "['stop_n_inliers=inf, stop_probability=0.99, stop_score=inf), None]']\n", - "['2020-07-31 08', '44', '28,396', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '28,396', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '28,441', 'INFO', 'Initializing TheilSen Regressor']\n", - "['2020-07-31 08', '44', '28,446', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '28,450', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '30,326', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '30,328', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '30,328', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '30,334', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '30,339', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '30,808', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '30,808', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '30,808', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '30,824', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '30,830', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '31,292', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '31,292', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '31,292', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '31,307', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '31,313', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '31,820', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '31,822', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '31,822', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '31,827', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '31,827', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,321', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,321', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,321', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,336', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '32,336', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '32,353', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '32,409', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '32,409', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'save_model(model=TheilSenRegressor(copy_X=True, fit_intercept=True, max_iter=300,']\n", - "['max_subpopulation=10000, n_jobs=-1, n_subsamples=None,']\n", - "['random_state=123, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), TheilSenRegressor(copy_X=True, fit_intercept=True, max_iter=300,']\n", - "['max_subpopulation=10000, n_jobs=-1, n_subsamples=None,']\n", - "['random_state=123, tol=0.001, verbose=False), None]']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '32,410', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '32,457', 'INFO', 'Initializing Huber Regressor']\n", - "['2020-07-31 08', '44', '32,457', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '32,468', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,520', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,522', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,522', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,527', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '32,527', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,579', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,580', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,580', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,586', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '32,591', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,636', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,638', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,638', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,643', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '32,650', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,690', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,692', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,692', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,697', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '32,702', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,749', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,750', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,750', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,756', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '32,756', 'INFO', 'Creating metrics dataframe']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '44', '32,761', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '32,821', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '32,822', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '32,822', 'INFO', 'save_model(model=HuberRegressor(alpha=0.0001, epsilon=1.35, fit_intercept=True, max_iter=100,']\n", - "['tol=1e-05, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '32,822', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '32,827', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '32,831', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), HuberRegressor(alpha=0.0001, epsilon=1.35, fit_intercept=True, max_iter=100,']\n", - "['tol=1e-05, warm_start=False), None]']\n", - "['2020-07-31 08', '44', '32,831', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '32,831', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '32,860', 'INFO', 'Initializing Support Vector Machine']\n", - "['2020-07-31 08', '44', '32,860', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '32,880', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,938', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,942', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,943', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,948', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '32,953', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '32,976', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '32,981', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '32,981', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '32,986', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '32,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,013', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,018', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,018', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,024', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '33,029', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,053', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,058', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,058', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,062', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '33,067', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,096', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,096', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,101', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '33,102', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '33,113', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '33,175', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '33,176', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '33,176', 'INFO', \"save_model(model=SVR(C=1.0, cache_size=200, coef0=0.0, degree=3, epsilon=0.1, gamma='scale',\"]\n", - "[\"kernel='rbf', max_iter=-1, shrinking=True, tol=0.001, verbose=False), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '33,176', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '33,177', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '33,177', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), SVR(C=1.0, cache_size=200, coef0=0.0, degree=3, epsilon=0.1, gamma='scale',\"]\n", - "[\"kernel='rbf', max_iter=-1, shrinking=True, tol=0.001, verbose=False), None]\"]\n", - "['2020-07-31 08', '44', '33,177', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '33,177', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '33,211', 'INFO', 'Initializing K Neighbors Regressor']\n", - "['2020-07-31 08', '44', '33,227', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '33,227', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,227', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,358', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,358', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,373', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '33,383', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,388', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,507', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,507', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,507', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '33,519', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,523', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,641', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,641', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,657', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '33,669', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,674', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,780', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,780', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,788', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '33,794', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '33,798', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '33,908', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '33,908', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '33,908', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '33,908', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '33,945', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '34,004', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '34,005', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '34,005', 'INFO', \"save_model(model=KNeighborsRegressor(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '34,005', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '34,010', 'INFO', 'Trained Model.pkl saved in current working directory']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '44', '34,011', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), KNeighborsRegressor(algorithm='auto', leaf_size=30, metric='minkowski',\"]\n", - "['metric_params=None, n_jobs=-1, n_neighbors=5, p=2,']\n", - "[\"weights='uniform'), None]\"]\n", - "['2020-07-31 08', '44', '34,011', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '34,011', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '34,042', 'INFO', 'Initializing Decision Tree']\n", - "['2020-07-31 08', '44', '34,060', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '34,065', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,070', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,072', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,072', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,078', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '34,084', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,089', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,090', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,090', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,096', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '34,101', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,105', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,107', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,107', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,113', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '34,118', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,122', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,124', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,124', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,130', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '34,135', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,140', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,141', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,141', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,147', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '34,147', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '34,159', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '34,216', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '34,217', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '34,217', 'INFO', \"save_model(model=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '44', '34,217', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '34,222', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '34,226', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), None]\"]\n", - "['2020-07-31 08', '44', '34,226', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '34,226', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '34,259', 'INFO', 'Initializing Random Forest']\n", - "['2020-07-31 08', '44', '34,259', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '34,276', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,425', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,550', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,550', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,550', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '34,561', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '34,708', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '34,813', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '34,814', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '34,828', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '34,844', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '35,092', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '35,197', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '35,197', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '35,203', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '35,208', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '35,456', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '35,575', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '35,575', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '35,582', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '35,590', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '35,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '35,966', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '35,966', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '35,966', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '35,966', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '35,981', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '36,045', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '36,045', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '36,045', 'INFO', \"save_model(model=RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '36,045', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '36,076', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '36,076', 'INFO', '[Pipeline(memory=None,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '44', '36,076', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '36,076', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '36,123', 'INFO', 'Initializing Extra Trees Regressor']\n", - "['2020-07-31 08', '44', '36,123', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '36,141', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '36,290', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '36,396', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '36,396', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '36,412', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '36,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '36,574', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '36,684', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '36,684', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '36,684', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '36,699', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '36,842', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '36,962', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '36,962', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '36,977', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '36,990', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,141', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,267', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,267', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,282', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '37,299', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,441', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,558', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,558', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,558', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '37,558', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '37,573', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '37,661', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '37,661', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '37,661', 'INFO', \"save_model(model=ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '37,661', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '37,693', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '37,693', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '44', '37,693', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '37,693', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '37,739', 'INFO', 'Initializing AdaBoost Regressor']\n", - "['2020-07-31 08', '44', '37,739', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '37,758', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,782', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,785', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,785', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,790', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '37,797', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,817', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,820', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,820', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,827', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '37,833', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,851', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,854', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,854', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,861', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '37,866', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,882', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,884', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,884', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,891', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '37,897', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '37,916', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '37,918', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '37,918', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '37,925', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '37,925', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '37,939', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '37,998', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '37,998', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '37,999', 'INFO', \"save_model(model=AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '37,999', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '38,008', 'INFO', 'Trained Model.pkl saved in current working directory']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '44', '38,013', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", - "['n_estimators=50, random_state=123), None]']\n", - "['2020-07-31 08', '44', '38,013', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '38,013', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '38,045', 'INFO', 'Initializing Gradient Boosting Regressor']\n", - "['2020-07-31 08', '44', '38,045', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '38,066', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,130', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,145', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,145', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,145', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '38,159', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,230', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,230', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,230', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,230', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '38,245', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,318', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,320', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,320', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,326', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '38,332', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,396', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,396', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,396', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,396', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '38,415', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,484', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,486', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,486', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,492', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '38,492', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '38,508', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', \"save_model(model=GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '38,563', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '38,578', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '44', '38,578', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '38,578', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '38,625', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 08', '44', '38,625', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '38,642', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,685', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,686', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,687', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,697', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '38,711', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,753', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,755', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,755', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,773', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '38,783', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,827', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,829', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,829', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,846', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '38,855', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,899', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,901', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,901', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,914', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '38,926', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '38,968', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '38,970', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '38,970', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '38,982', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '38,983', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '39,014', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', \"save_model(model=XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '39,096', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '39,112', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), None]']\n", - "['2020-07-31 08', '44', '39,112', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '39,112', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '39,143', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 08', '44', '39,159', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '39,165', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,231', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,246', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,246', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,246', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '39,269', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,361', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,365', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,365', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,378', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '39,388', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,482', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,486', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,486', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,499', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '39,510', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,581', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,581', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,581', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,596', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '39,608', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '39,693', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '39,697', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '39,697', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '39,710', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '39,710', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '39,742', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '44', '39,836', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '39,836', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '39,837', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '39,837', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '39,848', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '39,848', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '44', '39,848', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '39,848', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '39,956', 'INFO', 'Initializing CatBoost Regressor']\n", - "['2020-07-31 08', '44', '39,961', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '39,969', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '41,306', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '41,306', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '41,306', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '41,322', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '41,330', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '42,400', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '42,402', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '42,403', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '42,410', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '42,416', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '43,476', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '43,492', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '43,492', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '43,492', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '43,504', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '44,609', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '44,609', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '44,609', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '44,609', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '44,627', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '45,698', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '45,723', 'INFO', 'Creating MLFlow logs']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '44', '45,774', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '44', '45,775', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '44', '45,775', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '44', '45,775', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '44', '45,813', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '44', '45,834', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), , None]']\n", - "['2020-07-31 08', '44', '45,834', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '45,834', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '44', '45,916', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 08', '44', '45,916', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'create_model(estimator=xgboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '44', '45,927', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '44', '45,935', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '44', '45,935', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '44', '45,936', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '44', '45,936', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '44', '45,937', 'INFO', 'Extreme Gradient Boosting Regressor Imported succesfully']\n", - "['2020-07-31 08', '44', '45,937', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '44', '45,938', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '44', '45,939', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '45,977', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '45,979', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '45,979', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '45,990', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '44', '45,992', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,031', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,033', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,033', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,044', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '44', '46,048', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,067', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,083', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,083', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,083', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '44', '46,083', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,129', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,129', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,129', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,129', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '44', '46,145', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,176', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,176', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,176', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,192', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '44', '46,192', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,223', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,223', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,223', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,239', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '44', '46,239', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,270', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,270', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,270', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,286', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '44', '46,286', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,335', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,337', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,337', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,349', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '44', '46,350', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,397', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,397', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,397', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,412', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '44', '46,412', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '44', '46,459', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '44', '46,459', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '44', '46,459', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '44', '46,475', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '44', '46,475', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '44', '46,490', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'display_container', '1']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', \"XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '44', '46,521', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', 'create_model_container', '1']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', 'master_model_container', '1']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', 'display_container', '2']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', \"XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 08', '44', '46,646', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '06,693', 'INFO', 'Initializing create_model()']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '06,693', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '06,694', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '06,694', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '06,694', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '06,717', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '06,717', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '06,718', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '06,718', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '06,722', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '06,723', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '06,728', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '06,733', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '06,819', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '06,823', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '06,823', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '06,852', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '06,860', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '06,951', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '06,955', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '06,955', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '06,984', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '06,992', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,090', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,094', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,094', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,123', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '07,132', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,207', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,207', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,207', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,246', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '07,255', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,339', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,343', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,343', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,374', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '07,383', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,466', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,469', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,469', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,499', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '07,507', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,591', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,595', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,595', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,626', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '07,635', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,717', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,721', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,721', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,753', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '07,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,842', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,842', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,842', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '07,877', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '07,885', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '07,972', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '07,975', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '07,976', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '08,009', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '08,011', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '08,024', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '08,113', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '08,329', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '08,329', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '08,330', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '08,330', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '08,349', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '08,360', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '08,360', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '08,361', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '08,401', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '08,401', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', 'create_model_container', '2']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', 'master_model_container', '2']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', 'display_container', '3']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '08,459', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '09,734', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '09,734', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '09,734', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '09,734', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '09,735', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '09,754', 'INFO', 'Copying training dataset']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '09,755', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '09,756', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '09,756', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '09,761', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '09,761', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '09,766', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '09,771', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '09,853', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '09,857', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '09,857', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '09,886', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '09,894', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '09,980', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '09,984', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '09,984', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,013', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '10,023', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,104', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,108', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,108', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,137', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '10,145', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,250', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,253', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,254', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,285', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '10,294', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,393', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,396', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,397', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,426', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '10,435', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,516', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,520', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,520', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,542', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '10,565', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,650', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,654', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,654', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,685', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '10,693', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,777', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,780', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,781', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,812', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '10,821', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '10,905', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '10,910', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '10,910', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '10,948', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '10,957', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '11,041', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '11,045', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '11,045', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '11,075', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '11,077', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '11,094', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '11,191', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '11,397', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '11,397', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '11,398', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '11,399', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '11,417', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '11,427', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '11,428', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '11,428', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '11,465', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '11,465', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '11,521', 'INFO', 'create_model_container', '3']\n", - "['2020-07-31 08', '45', '11,522', 'INFO', 'master_model_container', '3']\n", - "['2020-07-31 08', '45', '11,522', 'INFO', 'display_container', '4']\n", - "['2020-07-31 08', '45', '11,522', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '11,522', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '11,523', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '11,540', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '11,541', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '11,542', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '11,542', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '11,546', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '11,547', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '11,551', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '11,557', 'INFO', 'Fitting Model']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '11,638', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '11,642', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '11,642', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '11,670', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '11,679', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '11,784', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '11,788', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '11,788', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '11,812', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '11,820', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,003', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,007', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,007', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,037', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '12,046', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,125', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,126', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,126', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,159', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '12,168', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,250', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,254', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,254', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,285', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '12,294', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,383', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,387', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,387', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,417', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '12,426', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,492', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,508', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,508', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,542', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '12,550', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,660', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,663', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,664', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,698', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '12,708', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,794', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,798', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,798', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,830', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '12,838', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '12,921', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '12,925', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '12,925', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '12,959', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '12,961', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '12,975', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '13,077', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '13,302', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '13,303', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '13,304', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.2, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '13,304', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '13,323', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '13,335', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.2, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '13,335', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '13,335', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '13,373', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '13,373', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '13,434', 'INFO', 'create_model_container', '4']\n", - "['2020-07-31 08', '45', '13,434', 'INFO', 'master_model_container', '4']\n", - "['2020-07-31 08', '45', '13,434', 'INFO', 'display_container', '5']\n", - "['2020-07-31 08', '45', '13,434', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.2, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '13,435', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '13,452', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '13,452', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '13,453', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '13,453', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '13,458', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '13,458', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '13,463', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '13,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '13,542', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '13,542', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '13,542', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '13,579', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '13,588', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '13,659', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '13,659', 'INFO', 'No inverse transformation']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '13,659', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '13,700', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '13,708', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '13,776', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '13,776', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '13,776', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '13,820', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '13,828', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '13,910', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '13,910', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '13,910', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '13,943', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '13,951', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,043', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,043', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,043', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,081', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '14,090', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,196', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,200', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,200', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,230', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '14,240', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,334', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,337', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,338', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,370', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '14,379', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,463', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,467', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,467', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,498', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '14,507', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,588', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,592', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,592', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,625', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '14,634', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '14,732', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '14,736', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '14,736', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '14,767', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '14,769', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '14,783', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '14,871', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '15,089', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '15,090', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '15,091', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.30000000000000004,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '15,091', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '15,110', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '15,122', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.30000000000000004,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '15,122', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '15,122', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '15,159', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '15,159', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', 'create_model_container', '5']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', 'master_model_container', '5']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', 'display_container', '6']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.30000000000000004,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0)']\n", - "['2020-07-31 08', '45', '15,219', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '15,220', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '15,236', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '15,237', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '15,238', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '15,238', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '15,242', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '15,243', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '15,247', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '15,252', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,327', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,327', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,327', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,364', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '15,373', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,457', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,461', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,461', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,489', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '15,497', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,578', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,578', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,578', 'INFO', 'Compiling Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '15,610', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '15,619', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,726', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,730', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,730', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,759', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '15,769', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '15,861', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '15,865', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '15,865', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '15,897', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '15,906', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,004', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,008', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,039', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '16,049', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,142', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,146', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,147', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,180', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '16,189', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,280', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,284', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,284', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,315', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '16,325', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,410', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,414', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,414', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,449', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '16,458', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '16,553', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '16,557', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '16,557', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '16,592', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '16,594', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '16,608', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '16,701', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '16,919', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '16,920', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '16,921', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.4, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '16,922', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '16,944', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '16,956', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.4, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '16,956', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '16,956', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '16,995', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '16,995', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '17,052', 'INFO', 'create_model_container', '6']\n", - "['2020-07-31 08', '45', '17,052', 'INFO', 'master_model_container', '6']\n", - "['2020-07-31 08', '45', '17,053', 'INFO', 'display_container', '7']\n", - "['2020-07-31 08', '45', '17,053', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.4, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '17,053', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '17,054', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '17,072', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '17,072', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '17,073', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '17,074', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '17,078', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '17,079', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '17,083', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '17,087', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,160', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,160', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,160', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,198', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '17,207', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,292', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,296', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,296', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,323', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '17,333', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,428', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,432', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,432', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,465', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '17,474', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,575', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,578', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,579', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,610', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '17,618', 'INFO', 'Fitting Model']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '17,703', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,707', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,707', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,738', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '17,744', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,830', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,834', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,834', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,865', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '17,873', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '17,945', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '17,961', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '17,961', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '17,992', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '18,001', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '18,090', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '18,094', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '18,094', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '18,128', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '18,140', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '18,227', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '18,232', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '18,232', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '18,268', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '18,276', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '18,360', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '18,364', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '18,365', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '18,399', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '18,401', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '18,414', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '18,521', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '18,779', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '18,779', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '18,779', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.5, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '18,779', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '18,795', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '18,811', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.5, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '18,811', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '18,811', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '18,857', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '18,857', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', 'create_model_container', '7']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', 'master_model_container', '7']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', 'display_container', '8']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.5, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '18,918', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '18,919', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '18,934', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '18,935', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '18,935', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '18,936', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '18,940', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '18,941', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '18,946', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '18,951', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,042', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,046', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,047', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,076', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '19,087', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,162', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,162', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,205', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '19,214', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,296', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,296', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,296', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,330', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '19,339', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,424', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,428', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,428', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,458', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '19,467', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,578', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,578', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,578', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,618', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '19,628', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,716', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,720', 'INFO', 'No inverse transformation']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '19,720', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,752', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '19,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,843', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,847', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,848', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '19,881', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '19,890', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '19,986', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '19,990', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '19,990', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '20,023', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '20,032', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '20,122', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '20,126', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '20,126', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '20,163', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '20,172', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '20,246', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '20,246', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '20,246', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '20,292', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '20,294', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '20,309', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '20,394', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '20,611', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '20,612', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '20,613', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.6, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '20,613', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '20,630', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '20,645', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.6, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '20,645', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '20,645', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '20,692', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '20,692', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '20,742', 'INFO', 'create_model_container', '8']\n", - "['2020-07-31 08', '45', '20,742', 'INFO', 'master_model_container', '8']\n", - "['2020-07-31 08', '45', '20,742', 'INFO', 'display_container', '9']\n", - "['2020-07-31 08', '45', '20,743', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.6, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '20,743', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '20,744', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '20,760', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '20,760', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '20,761', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '20,761', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '20,765', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '20,766', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '20,770', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '20,777', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '20,846', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '20,846', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '20,846', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '20,888', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '20,897', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '20,996', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '20,996', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '20,996', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,041', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '21,051', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,146', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,162', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,200', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '21,215', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,297', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,313', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,313', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,346', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '21,356', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,450', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,454', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,454', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,485', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '21,497', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,597', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,601', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,601', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,634', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '21,643', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,742', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,747', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,747', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,782', 'INFO', 'Initializing Fold 8']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '21,795', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '21,879', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '21,879', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '21,879', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '21,924', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '21,934', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '22,027', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '22,043', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '22,043', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '22,084', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '22,093', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '22,195', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '22,195', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '22,195', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '22,245', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '22,248', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '22,266', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '22,362', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '22,584', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '22,584', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '22,586', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.7000000000000001,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '22,586', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '22,609', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '22,614', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.7000000000000001,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '22,614', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '22,614', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '22,692', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '22,692', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '22,739', 'INFO', 'create_model_container', '9']\n", - "['2020-07-31 08', '45', '22,739', 'INFO', 'master_model_container', '9']\n", - "['2020-07-31 08', '45', '22,739', 'INFO', 'display_container', '10']\n", - "['2020-07-31 08', '45', '22,743', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.7000000000000001,\"]\n", - "['max_depth=-1, min_child_samples=20, min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100, n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123, reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0, subsample_for_bin=200000,']\n", - "['subsample_freq=0)']\n", - "['2020-07-31 08', '45', '22,743', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '22,744', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '22,748', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '22,748', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '22,748', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '22,748', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '22,799', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '22,802', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '22,803', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '22,803', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '22,812', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '22,812', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '22,827', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '22,844', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '22,930', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '22,930', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '22,930', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '22,969', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '22,979', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,064', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,064', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,064', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,098', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '23,113', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,197', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,197', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,197', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,235', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '23,244', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,330', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,331', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,331', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,365', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '23,375', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,498', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,502', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,503', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,544', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '23,554', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,660', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,664', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,664', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,699', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '23,710', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,811', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,816', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,816', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,851', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '23,861', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '23,947', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '23,947', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '23,947', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '23,987', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '23,996', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '24,081', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '24,081', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '24,081', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '24,122', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '24,132', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '24,229', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '24,229', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '24,229', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '24,271', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '24,273', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '24,288', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '24,380', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '24,596', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '24,597', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '24,598', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.8, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '24,598', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '24,614', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '24,614', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.8, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '24,629', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '24,629', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '24,660', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '24,660', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', 'create_model_container', '10']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', 'master_model_container', '10']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', 'display_container', '11']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.8, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '24,726', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '24,727', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '24,744', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '24,744', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '24,745', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '24,745', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '24,750', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '45', '24,750', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '24,755', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '24,760', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '24,841', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '24,845', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '24,845', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '24,875', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '24,884', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '24,965', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '24,965', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '24,965', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,005', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '25,015', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,130', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,130', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,130', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,165', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '25,165', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,280', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,280', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,280', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,318', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '25,327', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,423', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,427', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,427', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,460', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '25,469', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,572', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,577', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,577', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,612', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '25,621', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,698', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,698', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,698', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,747', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '25,755', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,832', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,832', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,832', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '25,878', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '25,887', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '25,981', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '25,986', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '25,986', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '26,023', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '26,034', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '26,137', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '26,142', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '26,142', 'INFO', 'Compiling Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '26,180', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '26,182', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '26,197', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '26,299', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '26,531', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '26,532', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '26,533', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.9, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '26,533', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '26,548', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '26,564', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.9, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '26,564', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '26,564', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '26,626', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '26,626', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '26,673', 'INFO', 'create_model_container', '11']\n", - "['2020-07-31 08', '45', '26,673', 'INFO', 'master_model_container', '11']\n", - "['2020-07-31 08', '45', '26,673', 'INFO', 'display_container', '12']\n", - "['2020-07-31 08', '45', '26,675', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.9, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '26,675', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '35,225', 'INFO', 'Initializing tune_model()']\n", - "['2020-07-31 08', '45', '35,225', 'INFO', \"tune_model(estimator=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), fold=10, round=4, n_iter=50, custom_grid=None, optimize=MAE, choose_better=False, verbose=True)']\n", - "['2020-07-31 08', '45', '35,226', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '35,226', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '35,226', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '35,246', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '35,246', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '35,247', 'INFO', 'Checking base model']\n", - "['2020-07-31 08', '45', '35,248', 'INFO', 'Base model', 'Light Gradient Boosting Machine']\n", - "['2020-07-31 08', '45', '35,249', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '35,249', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '35,255', 'INFO', 'Defining Hyperparameters']\n", - "['2020-07-31 08', '45', '35,255', 'INFO', 'Initializing RandomizedSearchCV']\n", - "['2020-07-31 08', '45', '37,358', 'INFO', 'Random search completed']\n", - "['2020-07-31 08', '45', '37,367', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '37,377', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,389', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,392', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,423', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '37,431', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,444', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,447', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,478', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '37,488', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,500', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,504', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,536', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '37,545', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,564', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,567', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,598', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '37,608', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,621', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,625', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,656', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '37,664', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,677', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,681', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,717', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '37,726', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,738', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,741', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,778', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '37,788', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,802', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,806', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,841', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '37,851', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,863', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,866', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,903', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '37,913', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '37,926', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '37,930', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '37,967', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '37,969', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '37,984', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '37,996', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '37,996', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '37,997', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '38,113', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '38,113', 'INFO', 'Initializing save_model()']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '38,114', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.3, max_depth=70,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.2,']\n", - "['n_estimators=10, n_jobs=-1, num_leaves=10, objective=None,']\n", - "['random_state=123, reg_alpha=0.4, reg_lambda=0.1, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '38,114', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '38,121', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '38,132', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.3, max_depth=70,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.2,']\n", - "['n_estimators=10, n_jobs=-1, num_leaves=10, objective=None,']\n", - "['random_state=123, reg_alpha=0.4, reg_lambda=0.1, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '45', '38,132', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '38,132', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '38,394', 'INFO', 'create_model_container', '12']\n", - "['2020-07-31 08', '45', '38,394', 'INFO', 'master_model_container', '12']\n", - "['2020-07-31 08', '45', '38,395', 'INFO', 'display_container', '13']\n", - "['2020-07-31 08', '45', '38,395', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.3, max_depth=70,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.2,']\n", - "['n_estimators=10, n_jobs=-1, num_leaves=10, objective=None,']\n", - "['random_state=123, reg_alpha=0.4, reg_lambda=0.1, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n", - "['2020-07-31 08', '45', '38,395', 'INFO', 'tune_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '38,408', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '45', '38,409', 'INFO', 'create_model(estimator=dt, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=True, system=True)']\n", - "['2020-07-31 08', '45', '38,409', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '38,409', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '38,409', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '38,428', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '38,428', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '38,429', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '38,430', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '38,435', 'INFO', 'Decision Tree Regressor Imported succesfully']\n", - "['2020-07-31 08', '45', '38,437', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '45', '38,440', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '38,446', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,451', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,453', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,453', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,467', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '38,472', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,478', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,479', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,479', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,493', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '38,500', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,505', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,507', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,507', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,521', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '38,527', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,532', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,534', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,534', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,549', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '38,555', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,560', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,562', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,562', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,577', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '38,583', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,588', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,590', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,590', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,606', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '38,612', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,617', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,619', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,619', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,635', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '38,640', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,647', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,648', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,648', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,664', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '38,671', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,675', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,677', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,677', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,693', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '38,698', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '38,704', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '38,705', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '45', '38,705', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '38,722', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '38,723', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '38,731', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '38,739', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '38,888', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '38,888', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '38,889', 'INFO', \"save_model(model=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), model_name=Trained Model, verbose=False)\"]\n", - "['2020-07-31 08', '45', '38,889', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '38,895', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '38,900', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), None]\"]\n", - "['2020-07-31 08', '45', '38,900', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '38,901', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '38,918', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '38,918', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '38,949', 'INFO', 'create_model_container', '13']\n", - "['2020-07-31 08', '45', '38,949', 'INFO', 'master_model_container', '13']\n", - "['2020-07-31 08', '45', '38,949', 'INFO', 'display_container', '14']\n", - "['2020-07-31 08', '45', '38,950', 'INFO', \"DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best')\"]\n", - "['2020-07-31 08', '45', '38,950', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '38,955', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 08', '45', '38,955', 'INFO', \"ensemble_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Bagging, fold=10, n_estimators=50, round=4, choose_better=False, optimize=R2, verbose=True)\"]\n", - "['2020-07-31 08', '45', '38,955', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '38,955', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '38,955', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '38,978', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '38,978', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '38,980', 'INFO', 'Checking base model']\n", - "['2020-07-31 08', '45', '38,981', 'INFO', 'Base model', 'Decision Tree']\n", - "['2020-07-31 08', '45', '38,985', 'INFO', 'BaggingRegressor() succesfully imported']\n", - "['2020-07-31 08', '45', '38,990', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '38,991', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '38,996', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,156', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,162', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,178', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '39,183', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,330', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,335', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,350', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '39,355', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,486', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,486', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,515', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '39,521', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,651', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,666', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,684', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '39,689', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,816', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,816', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '39,844', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '39,849', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '39,986', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '39,986', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,007', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '40,012', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '40,154', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '40,154', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,178', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '40,183', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '40,327', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '40,332', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,348', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '40,353', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '40,503', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '40,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,528', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '40,533', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '40,698', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '40,704', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '40,721', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '40,722', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '40,730', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '40,882', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '40,882', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '40,883', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '40,950', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '40,951', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '40,952', 'INFO', 'save_model(model=BaggingRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=50, n_jobs=None, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '40,952', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '40,976', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '40,981', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['verbose=False), BaggingRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=50, n_jobs=None, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '45', '40,981', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '40,981', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'create_model_container', '14']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'master_model_container', '14']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'display_container', '15']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'BaggingRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "['bootstrap=True, bootstrap_features=False, max_features=1.0,']\n", - "['max_samples=1.0, n_estimators=50, n_jobs=None, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)']\n", - "['2020-07-31 08', '45', '41,120', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '41,133', 'INFO', 'Initializing ensemble_model()']\n", - "['2020-07-31 08', '45', '41,134', 'INFO', \"ensemble_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), method=Boosting, fold=10, n_estimators=10, round=4, choose_better=False, optimize=R2, verbose=True)\"]\n", - "['2020-07-31 08', '45', '41,134', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '41,134', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '41,134', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '41,157', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '41,157', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '41,159', 'INFO', 'Checking base model']\n", - "['2020-07-31 08', '45', '41,160', 'INFO', 'Base model', 'Decision Tree']\n", - "['2020-07-31 08', '45', '41,166', 'INFO', 'AdaBoostRegressor() succesfully imported']\n", - "['2020-07-31 08', '45', '41,172', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '41,172', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '41,179', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,212', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,214', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,228', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '41,233', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,265', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,268', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,283', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '41,288', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,322', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,325', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,339', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '41,345', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,378', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,380', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,395', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '41,399', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,443', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,445', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,460', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '45', '41,465', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,496', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,499', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,516', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '45', '41,521', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,555', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,557', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,573', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '45', '41,578', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,616', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,619', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,638', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '45', '41,644', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,686', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,690', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,707', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '45', '41,713', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '41,749', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '41,751', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '41,768', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '45', '41,768', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '45', '41,776', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '45', '41,814', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '45', '41,814', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '45', '41,814', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '45', '41,869', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '45', '41,869', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '45', '41,870', 'INFO', 'save_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '45', '41,871', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '45', '41,878', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '45', '41,883', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), None]']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '45', '41,883', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '41,883', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '45', '42,011', 'INFO', 'create_model_container', '15']\n", - "['2020-07-31 08', '45', '42,011', 'INFO', 'master_model_container', '15']\n", - "['2020-07-31 08', '45', '42,011', 'INFO', 'display_container', '16']\n", - "['2020-07-31 08', '45', '42,012', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '45', '42,012', 'INFO', 'ensemble_model() succesfully completed......................................']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'Initializing blend_models()']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'blend_models(estimator_list=All, fold=10, round=4, choose_better=False, optimize=R2, turbo=True, verbose=True)']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '45', '42,017', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '45', '42,034', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '45', '42,034', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '45', '42,036', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '45', '42,036', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '45', '42,041', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 08', '45', '42,041', 'INFO', 'Import successful']\n", - "['2020-07-31 08', '45', '42,042', 'INFO', 'Defining model names in estimator_list']\n", - "['2020-07-31 08', '45', '45,250', 'INFO', 'n_jobs multiple passed']\n", - "['2020-07-31 08', '45', '45,265', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '45', '45,280', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '48,335', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '48,715', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '48,739', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '45', '48,753', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '51,531', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '51,907', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '51,935', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '45', '51,944', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '54,960', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '55,340', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '55,370', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '45', '55,380', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '45', '58,319', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '45', '58,719', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '45', '58,743', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '45', '58,761', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '01,634', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '02,022', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '02,053', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '02,064', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '04,996', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '05,375', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '05,404', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '05,415', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '08,454', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '08,850', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '08,884', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '08,894', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '11,712', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '12,102', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '12,118', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '12,134', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '14,865', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '15,254', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '15,270', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '15,286', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '18,564', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '18,970', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '19,005', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '19,007', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '19,022', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '22,593', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '22,593', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '22,594', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '22,641', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '22,642', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '22,679', 'INFO', \"save_model(model=VotingRegressor(estimators=[('Linear Regression_0',\"]\n", - "['LinearRegression(copy_X=True, fit_intercept=True,']\n", - "['n_jobs=-1, normalize=False)),']\n", - "[\"('Lasso_1',\"]\n", - "['Lasso(alpha=1.0, copy_X=True, fit_intercept=True,']\n", - "['max_iter=1000, normalize=False,']\n", - "['positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic',\"]\n", - "['tol=0.0001, warm_start=False)),']\n", - "[\"('Ridge_2',\"]\n", - "['Ridge(alpha=1.0, copy_X=True...']\n", - "['min_child_samples=20,']\n", - "['min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100,']\n", - "['n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123,']\n", - "['reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0,']\n", - "['subsample_for_bin=200000,']\n", - "['subsample_freq=0)),']\n", - "[\"('CatBoost Regressor_21',\"]\n", - "[')],']\n", - "['n_jobs=-1, verbose=False, weights=None), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '22,679', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '22,831', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '22,915', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), VotingRegressor(estimators=[('Linear Regression_0',\"]\n", - "['LinearRegression(copy_X=True, fit_intercept=True,']\n", - "['n_jobs=-1, normalize=False)),']\n", - "[\"('Lasso_1',\"]\n", - "['Lasso(alpha=1.0, copy_X=True, fit_intercept=True,']\n", - "['max_iter=1000, normalize=False,']\n", - "['positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic',\"]\n", - "['tol=0.0001, warm_start=False)),']\n", - "[\"('Ridge_2',\"]\n", - "['Ridge(alpha=1.0, copy_X=True...']\n", - "['min_child_samples=20,']\n", - "['min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100,']\n", - "['n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123,']\n", - "['reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0,']\n", - "['subsample_for_bin=200000,']\n", - "['subsample_freq=0)),']\n", - "[\"('CatBoost Regressor_21',\"]\n", - "[')],']\n", - "['n_jobs=-1, verbose=False, weights=None), None]']\n", - "['2020-07-31 08', '46', '22,915', 'INFO', 'save_model() succesfully completed......................................']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '46', '22,915', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '23,715', 'INFO', 'create_model_container', '16']\n", - "['2020-07-31 08', '46', '23,715', 'INFO', 'master_model_container', '16']\n", - "['2020-07-31 08', '46', '23,715', 'INFO', 'display_container', '17']\n", - "['2020-07-31 08', '46', '23,735', 'INFO', \"VotingRegressor(estimators=[('Linear Regression_0',\"]\n", - "['LinearRegression(copy_X=True, fit_intercept=True,']\n", - "['n_jobs=-1, normalize=False)),']\n", - "[\"('Lasso_1',\"]\n", - "['Lasso(alpha=1.0, copy_X=True, fit_intercept=True,']\n", - "['max_iter=1000, normalize=False,']\n", - "['positive=False, precompute=False,']\n", - "[\"random_state=123, selection='cyclic',\"]\n", - "['tol=0.0001, warm_start=False)),']\n", - "[\"('Ridge_2',\"]\n", - "['Ridge(alpha=1.0, copy_X=True...']\n", - "['min_child_samples=20,']\n", - "['min_child_weight=0.001,']\n", - "['min_split_gain=0.0, n_estimators=100,']\n", - "['n_jobs=-1, num_leaves=31,']\n", - "['objective=None, random_state=123,']\n", - "['reg_alpha=0.0, reg_lambda=0.0,']\n", - "['silent=True, subsample=1.0,']\n", - "['subsample_for_bin=200000,']\n", - "['subsample_freq=0)),']\n", - "[\"('CatBoost Regressor_21',\"]\n", - "[')],']\n", - "['n_jobs=-1, verbose=False, weights=None)']\n", - "['2020-07-31 08', '46', '23,735', 'INFO', 'blend_models() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '23,746', 'INFO', 'Initializing compare_models()']\n", - "['2020-07-31 08', '46', '23,746', 'INFO', \"compare_models(blacklist=None, whitelist=['rf', 'et', 'ada', 'gbr', 'xgboost', 'lightgbm', 'catboost'], fold=5, round=4, sort=R2, n_select=5, turbo=True, verbose=True)\"]\n", - "['2020-07-31 08', '46', '23,746', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '23,746', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '23,746', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '23,764', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '23,765', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '23,770', 'INFO', 'Importing untrained models']\n", - "['2020-07-31 08', '46', '23,771', 'INFO', 'Import successful']\n", - "['2020-07-31 08', '46', '23,777', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '23,777', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '23,777', 'INFO', 'Initializing Random Forest']\n", - "['2020-07-31 08', '46', '23,782', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '23,789', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '24,034', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '24,142', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '24,143', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '24,164', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '24,176', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '24,434', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '24,549', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '24,549', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '24,561', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '24,578', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '24,918', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '25,038', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '25,038', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '25,064', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '25,081', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '25,328', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '25,435', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '25,436', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '25,448', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '25,458', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '25,707', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '25,823', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '25,823', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '25,823', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '25,823', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '25,838', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '25,900', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '25,900', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '25,900', 'INFO', \"save_model(model=RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '25,900', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '25,932', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '25,932', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '46', '25,932', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '25,932', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '25,987', 'INFO', 'Initializing Extra Trees Regressor']\n", - "['2020-07-31 08', '46', '25,992', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '25,998', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '26,142', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '26,268', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '26,268', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '26,284', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '26,303', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '26,440', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '26,546', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '26,546', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '26,553', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '26,563', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '26,705', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '26,821', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '26,821', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '26,836', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '26,852', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,011', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,117', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,118', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,139', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '27,139', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,295', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,421', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,421', 'INFO', 'Compiling Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '46', '27,421', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '27,421', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '27,436', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '27,502', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '27,502', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '27,503', 'INFO', \"save_model(model=ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '27,503', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '27,523', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '27,539', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), ExtraTreesRegressor(bootstrap=False, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '46', '27,539', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '27,539', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '27,586', 'INFO', 'Initializing AdaBoost Regressor']\n", - "['2020-07-31 08', '46', '27,601', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '27,601', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,633', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,633', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,633', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,633', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '27,647', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,663', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,665', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,665', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,670', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '27,674', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,674', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,674', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,674', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,689', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '27,689', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,705', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,705', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,705', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,705', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '27,721', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '27,736', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '27,752', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '27,799', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '27,799', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '27,799', 'INFO', \"save_model(model=AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", - "['n_estimators=50, random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '27,799', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '27,814', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '27,814', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), AdaBoostRegressor(base_estimator=None, learning_rate=1.0, loss='linear',\"]\n", - "['n_estimators=50, random_state=123), None]']\n", - "['2020-07-31 08', '46', '27,814', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '27,814', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '27,846', 'INFO', 'Initializing Gradient Boosting Regressor']\n", - "['2020-07-31 08', '46', '27,846', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '27,861', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '27,924', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '27,924', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '27,924', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '27,939', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '27,939', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,002', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,018', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,018', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,018', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '28,018', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '28,096', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,174', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,174', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,174', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,174', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '28,189', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,252', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,252', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,252', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,267', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '28,267', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '28,267', 'INFO', 'Creating MLFlow logs']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '46', '28,330', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '28,330', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '28,330', 'INFO', \"save_model(model=GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '28,330', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '28,346', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '28,346', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False), None]']\n", - "['2020-07-31 08', '46', '28,346', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '28,346', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '28,408', 'INFO', 'Initializing Extreme Gradient Boosting']\n", - "['2020-07-31 08', '46', '28,408', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '28,424', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,471', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,471', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,471', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,486', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '28,502', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,549', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,549', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,549', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,564', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '28,580', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,611', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,611', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,611', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,627', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '28,642', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,689', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,689', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,689', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,705', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '28,720', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '28,767', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '28,783', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '28,783', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '28,799', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '28,799', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '28,830', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '28,939', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '28,939', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '28,939', 'INFO', \"save_model(model=XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '28,939', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '28,955', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '28,955', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0), None]']\n", - "['2020-07-31 08', '46', '28,955', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '28,955', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '29,017', 'INFO', 'Initializing Light Gradient Boosting Machine']\n", - "['2020-07-31 08', '46', '29,017', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '29,033', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,127', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,127', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,127', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,142', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '29,158', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,252', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,267', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,267', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,283', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '29,283', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,392', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,392', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,392', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,423', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '29,423', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,533', 'INFO', 'Evaluating Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '46', '29,533', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,533', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,548', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '29,564', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '29,658', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '29,673', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '29,673', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '29,689', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '29,689', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '29,720', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '29,830', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '29,830', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '29,830', 'INFO', \"save_model(model=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '29,830', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '29,861', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '29,876', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), None]']\n", - "['2020-07-31 08', '46', '29,876', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '29,876', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '29,970', 'INFO', 'Initializing CatBoost Regressor']\n", - "['2020-07-31 08', '46', '29,970', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '29,986', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '31,376', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '31,392', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '31,392', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '31,392', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '31,407', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '32,847', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '32,863', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '32,863', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '32,863', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '32,878', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '34,175', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '34,175', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '34,175', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '34,190', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '34,190', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '35,582', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '35,582', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '35,582', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '35,582', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '35,598', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,028', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,028', 'INFO', 'No inverse transformer found']\n", - "['2020-07-31 08', '46', '37,028', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,043', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '37,043', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '37,059', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '46', '37,121', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '46', '37,121', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '46', '37,121', 'INFO', 'save_model(model=, model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '46', '37,121', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '46', '37,137', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '46', '37,137', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), , None]']\n", - "['2020-07-31 08', '46', '37,137', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '37,137', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '46', '37,184', 'INFO', 'Finalizing top_n models']\n", - "['2020-07-31 08', '46', '37,184', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'create_model(estimator=xgboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Extreme Gradient Boosting Regressor Imported succesfully']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '37,200', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,246', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,246', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,246', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,262', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '37,262', 'INFO', 'Fitting Model']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '46', '37,309', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,309', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,309', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,325', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '37,325', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,371', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,371', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,371', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,387', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '37,387', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,434', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,434', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,434', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,449', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '37,449', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,496', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,496', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,496', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,512', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '37,512', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,559', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,559', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,559', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,574', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '37,590', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,621', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,637', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,637', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,653', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '37,653', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,699', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,699', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,699', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,715', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '37,715', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,762', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,762', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,762', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,778', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '37,778', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '37,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '37,840', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '37,840', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '37,856', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '37,856', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '37,871', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'create_model_container', '17']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'master_model_container', '17']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'display_container', '18']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', \"XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "['silent=None, subsample=1, verbosity=0)']\n", - "['2020-07-31 08', '46', '37,934', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'create_model(estimator=gbr, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '37,949', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Gradient Boosting Regressor Imported succesfully']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '37,981', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '38,121', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '38,231', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,324', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,324', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,324', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,340', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '38,340', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,418', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,418', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,418', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,434', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '38,434', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '38,512', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,590', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,590', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,590', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,605', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '38,605', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '38,683', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '38,762', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '38,840', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '38,918', 'INFO', 'Creating metrics dataframe']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '46', '38,933', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'create_model_container', '18']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'master_model_container', '18']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'display_container', '19']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', \"GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "['validation_fraction=0.1, verbose=0, warm_start=False)']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'create_model(estimator=catboost, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '39,012', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'CatBoost Regressor Imported succesfully']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '39,027', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '40,292', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '41,620', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '41,620', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '41,620', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '41,636', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '41,636', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '42,979', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '42,995', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '42,995', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '42,995', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '42,995', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '44,323', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '45,653', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '45,653', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '45,653', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '45,669', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '45,669', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '47,181', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '47,181', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '47,181', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '47,197', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '47,197', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '48,509', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '48,509', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '48,509', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '48,524', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '48,524', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '49,928', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '49,939', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '49,940', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '49,953', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '49,955', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '51,527', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '51,530', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '51,530', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '51,540', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '51,542', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '53,254', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '53,260', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '53,260', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '53,270', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '53,272', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '53,276', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '54,768', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '54,768', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '54,768', 'INFO', 'create_model_container', '19']\n", - "['2020-07-31 08', '46', '54,769', 'INFO', 'master_model_container', '19']\n", - "['2020-07-31 08', '46', '54,769', 'INFO', 'display_container', '20']\n", - "['2020-07-31 08', '46', '54,769', 'INFO', '']\n", - "['2020-07-31 08', '46', '54,769', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'create_model(estimator=rf, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '54,775', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '54,786', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '54,787', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '54,787', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '54,788', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '54,788', 'INFO', 'Random Forest Regressor Imported succesfully']\n", - "['2020-07-31 08', '46', '54,789', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '54,790', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '54,792', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '55,056', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '55,173', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '55,173', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '55,183', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '55,185', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '55,444', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '55,568', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '55,568', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '55,568', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '55,568', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '55,811', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '55,932', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '55,932', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '55,932', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '55,932', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '56,191', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '56,303', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '56,303', 'INFO', 'Compiling Metrics']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '46', '56,310', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '56,311', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '56,564', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '56,678', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '56,678', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '56,684', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '56,685', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '56,948', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '57,053', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '57,055', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '57,066', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '57,066', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '57,232', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '57,338', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '57,338', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '57,348', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '57,349', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '57,609', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '57,724', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '57,724', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '57,726', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '57,740', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '57,980', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '58,097', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '58,097', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '58,097', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '58,097', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '58,350', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '58,456', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '58,456', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '58,464', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '58,465', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '58,469', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'create_model_container', '20']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'master_model_container', '20']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'display_container', '21']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', \"RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "['random_state=123, verbose=0, warm_start=False)']\n", - "['2020-07-31 08', '46', '58,727', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'create_model(estimator=lightgbm, ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '46', '58,743', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '46', '58,766', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '46', '58,767', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '46', '58,768', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '46', '58,768', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '46', '58,768', 'INFO', 'Light Gradient Boosting Machine Imported succesfully']\n", - "['2020-07-31 08', '46', '58,769', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '46', '58,770', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '46', '58,772', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '58,848', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '58,848', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '58,848', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '58,864', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '46', '58,864', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '58,926', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '58,942', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '58,942', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '58,942', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '46', '58,958', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,037', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,041', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,041', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,053', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '46', '59,055', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,148', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,152', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,153', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,164', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '46', '59,166', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,250', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,250', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,250', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,265', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '46', '59,265', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,359', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,375', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,375', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,375', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '46', '59,390', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,492', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,497', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,497', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,510', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '46', '59,513', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,629', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,634', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,634', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,649', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '46', '59,652', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,760', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,765', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,765', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,778', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '46', '59,780', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '46', '59,935', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '46', '59,941', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '46', '59,941', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '46', '59,956', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '46', '59,959', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '46', '59,969', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '47', '00,131', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '47', '00,131', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '47', '00,131', 'INFO', 'create_model_container', '21']\n", - "['2020-07-31 08', '47', '00,132', 'INFO', 'master_model_container', '21']\n", - "['2020-07-31 08', '47', '00,132', 'INFO', 'display_container', '22']\n", - "['2020-07-31 08', '47', '00,133', 'INFO', \"LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '47', '00,133', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '00,133', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 08', '47', '00,231', 'INFO', 'create_model_container', '21']\n", - "['2020-07-31 08', '47', '00,231', 'INFO', 'master_model_container', '21']\n", - "['2020-07-31 08', '47', '00,231', 'INFO', 'display_container', '23']\n", - "['2020-07-31 08', '47', '00,233', 'INFO', \"[XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)]']\n", - "['2020-07-31 08', '47', '00,233', 'INFO', 'compare_models() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '00,241', 'INFO', 'Initializing stack_models()']\n", - "['2020-07-31 08', '47', '00,243', 'INFO', \"stack_models(estimator_list=[XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0)], meta_model=None, fold=10, round=4, restack=True, plot=False, choose_better=False, optimize=R2, finalize=False, verbose=True)']\n", - "['2020-07-31 08', '47', '00,243', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '00,243', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '00,243', 'INFO', 'Copying estimator list']\n", - "['2020-07-31 08', '47', '00,296', 'INFO', 'Defining meta model']\n", - "['2020-07-31 08', '47', '00,299', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '00,346', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '00,348', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '47', '00,349', 'INFO', 'Getting model names']\n", - "['2020-07-31 08', '47', '00,356', 'INFO', 'Checking base model', 'XGBRegressor']\n", - "['2020-07-31 08', '47', '00,367', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '00,435', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '01,084', 'INFO', 'Checking base model', 'GradientBoostingRegressor']\n", - "['2020-07-31 08', '47', '01,096', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '01,257', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '02,082', 'INFO', 'Checking base model', 'CatBoostRegressor']\n", - "['2020-07-31 08', '47', '02,097', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '03,663', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '24,424', 'INFO', 'Checking base model', 'RandomForestRegressor']\n", - "['2020-07-31 08', '47', '24,430', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '24,814', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '28,106', 'INFO', 'Checking base model', 'LGBMRegressor']\n", - "['2020-07-31 08', '47', '28,120', 'INFO', 'Fitting base model']\n", - "['2020-07-31 08', '47', '28,227', 'INFO', 'Generating cross val predictions']\n", - "['2020-07-31 08', '47', '29,899', 'INFO', 'Base layer complete']\n", - "['2020-07-31 08', '47', '29,916', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '47', '29,919', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '47', '29,935', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '29,942', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '29,948', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '29,990', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '47', '29,999', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,006', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,031', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '47', '30,044', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,052', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,057', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,089', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '47', '30,101', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,108', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,112', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,141', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '47', '30,153', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,158', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,163', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,190', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '47', '30,200', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,206', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,208', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,237', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '47', '30,247', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,253', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,255', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,280', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '47', '30,289', 'INFO', 'Fitting Model']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '47', '30,296', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,300', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,321', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '47', '30,330', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,335', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,338', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,369', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '47', '30,380', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '30,387', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '30,390', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '30,419', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '47', '30,420', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '47', '30,429', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '47', '30,430', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '47', '30,431', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '47', '30,542', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '30,542', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '30,547', 'INFO', \"save_model(model=[XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), True], model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '47', '30,547', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '30,631', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '30,651', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "[\"verbose=False), [XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), True], None]']\n", - "['2020-07-31 08', '47', '30,652', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '30,652', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '31,205', 'INFO', 'create_model_container', '22']\n", - "['2020-07-31 08', '47', '31,205', 'INFO', 'master_model_container', '22']\n", - "['2020-07-31 08', '47', '31,205', 'INFO', 'display_container', '24']\n", - "['2020-07-31 08', '47', '31,209', 'INFO', \"[XGBRegressor(base_score=0.5, booster='gbtree', colsample_bylevel=1,\"]\n", - "['colsample_bynode=1, colsample_bytree=1, gamma=0,']\n", - "[\"importance_type='gain', learning_rate=0.1, max_delta_step=0,\"]\n", - "['max_depth=3, min_child_weight=1, missing=None, n_estimators=100,']\n", - "[\"n_jobs=-1, nthread=None, objective='reg\", \"linear', random_state=123,\"]\n", - "['reg_alpha=0, reg_lambda=1, scale_pos_weight=1, seed=None,']\n", - "[\"silent=None, subsample=1, verbosity=0), GradientBoostingRegressor(alpha=0.9, ccp_alpha=0.0, criterion='friedman_mse',\"]\n", - "[\"init=None, learning_rate=0.1, loss='ls', max_depth=3,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0, n_estimators=100,']\n", - "[\"n_iter_no_change=None, presort='deprecated',\"]\n", - "['random_state=123, subsample=1.0, tol=0.0001,']\n", - "[\"validation_fraction=0.1, verbose=0, warm_start=False), , RandomForestRegressor(bootstrap=True, ccp_alpha=0.0, criterion='mse',\"]\n", - "[\"max_depth=None, max_features='auto', max_leaf_nodes=None,\"]\n", - "['max_samples=None, min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None, min_samples_leaf=1,']\n", - "['min_samples_split=2, min_weight_fraction_leaf=0.0,']\n", - "['n_estimators=100, n_jobs=-1, oob_score=False,']\n", - "[\"random_state=123, verbose=0, warm_start=False), LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), LinearRegression(copy_X=True, fit_intercept=True, n_jobs=-1, normalize=False), True]']\n", - "['2020-07-31 08', '47', '31,209', 'INFO', 'stack_models() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '31,222', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '31,223', 'INFO', \"plot_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), plot=residuals, save=False, verbose=True, system=True)\"]\n", - "['2020-07-31 08', '47', '31,223', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '31,224', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '31,224', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '31,239', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '31,240', 'INFO', 'plot type', 'residuals']\n", - "['2020-07-31 08', '47', '31,385', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '31,427', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 08', '47', '32,278', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '32,279', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '32,288', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '32,289', 'INFO', \"plot_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), plot=error, save=False, verbose=True, system=True)\"]\n", - "['2020-07-31 08', '47', '32,289', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '32,289', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '32,290', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '32,300', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '32,301', 'INFO', 'plot type', 'error']\n", - "['2020-07-31 08', '47', '32,302', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '32,303', 'INFO', 'Scoring test/hold-out set']\n", - "['2020-07-31 08', '47', '32,533', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '32,533', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '32,540', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '32,541', 'INFO', \"plot_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), plot=feature, save=False, verbose=True, system=True)\"]\n", - "['2020-07-31 08', '47', '32,541', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '32,541', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '32,541', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '32,551', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '32,552', 'INFO', 'plot type', 'feature']\n", - "['2020-07-31 08', '47', '32,696', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '32,697', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '32,721', 'INFO', 'Initializing plot_model()']\n", - "['2020-07-31 08', '47', '32,722', 'INFO', \"plot_model(estimator=DecisionTreeRegressor(ccp_alpha=0.0, criterion='mse', max_depth=None,\"]\n", - "['max_features=None, max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0, min_impurity_split=None,']\n", - "['min_samples_leaf=1, min_samples_split=2,']\n", - "[\"min_weight_fraction_leaf=0.0, presort='deprecated',\"]\n", - "[\"random_state=123, splitter='best'), plot=parameter, save=False, verbose=True, system=True)\"]\n", - "['2020-07-31 08', '47', '32,722', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '32,722', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '32,722', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '32,731', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '32,732', 'INFO', 'plot type', 'parameter']\n", - "['2020-07-31 08', '47', '32,740', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '32,740', 'INFO', 'plot_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '32,751', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 08', '47', '32,752', 'INFO', \"interpret_model(estimator=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), plot=summary, feature=None, observation=None)']\n", - "['2020-07-31 08', '47', '32,752', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '32,946', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '32,946', 'INFO', 'plot type', 'summary']\n", - "['2020-07-31 08', '47', '32,946', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 08', '47', '33,221', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 08', '47', '33,761', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '33,761', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '33,767', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 08', '47', '33,768', 'INFO', \"interpret_model(estimator=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), plot=correlation, feature=None, observation=None)']\n", - "['2020-07-31 08', '47', '33,768', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '33,769', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '33,769', 'INFO', 'plot type', 'correlation']\n", - "['2020-07-31 08', '47', '33,769', 'WARNING', 'No feature passed. Default value of feature used for correlation plot', 'age']\n", - "['2020-07-31 08', '47', '33,769', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 08', '47', '34,080', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 08', '47', '34,387', 'INFO', 'Visual Rendered Successfully']\n", - "['2020-07-31 08', '47', '34,387', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '34,395', 'INFO', 'Initializing interpret_model()']\n", - "['2020-07-31 08', '47', '34,396', 'INFO', \"interpret_model(estimator=LGBMRegressor(boosting_type='gbdt', class_weight=None, colsample_bytree=1.0,\"]\n", - "[\"importance_type='split', learning_rate=0.1, max_depth=-1,\"]\n", - "['min_child_samples=20, min_child_weight=0.001, min_split_gain=0.0,']\n", - "['n_estimators=100, n_jobs=-1, num_leaves=31, objective=None,']\n", - "['random_state=123, reg_alpha=0.0, reg_lambda=0.0, silent=True,']\n", - "['subsample=1.0, subsample_for_bin=200000, subsample_freq=0), plot=reason, feature=None, observation=12)']\n", - "['2020-07-31 08', '47', '34,396', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '34,397', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '34,397', 'INFO', 'plot type', 'reason']\n", - "['2020-07-31 08', '47', '34,398', 'INFO', 'Creating TreeExplainer']\n", - "['2020-07-31 08', '47', '34,661', 'INFO', 'Compiling shap values']\n", - "['2020-07-31 08', '47', '34,753', 'INFO', 'Visual Rendered Successfully']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '47', '34,754', 'INFO', 'interpret_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '34,811', 'INFO', 'Initializing automl()']\n", - "['2020-07-31 08', '47', '34,812', 'INFO', 'automl(optimize=MAE, use_holdout=False)']\n", - "['2020-07-31 08', '47', '34,812', 'INFO', 'Model Selection Basis', 'CV Results on Training set']\n", - "['2020-07-31 08', '47', '34,820', 'INFO', 'SubProcess finalize_model() called ==================================']\n", - "['2020-07-31 08', '47', '34,821', 'INFO', 'Initializing finalize_model()']\n", - "['2020-07-31 08', '47', '34,822', 'INFO', 'finalize_model(estimator=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123))']\n", - "['2020-07-31 08', '47', '34,822', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '34,822', 'INFO', 'Getting model name']\n", - "['2020-07-31 08', '47', '34,823', 'INFO', 'Finalizing AdaBoost Regressor']\n", - "['2020-07-31 08', '47', '34,883', 'INFO', 'Creating MLFlow logs']\n", - "['2020-07-31 08', '47', '34,935', 'INFO', 'SubProcess create_model() called ==================================']\n", - "['2020-07-31 08', '47', '34,936', 'INFO', 'Initializing create_model()']\n", - "['2020-07-31 08', '47', '34,937', 'INFO', 'create_model(estimator=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), ensemble=False, method=None, fold=10, round=4, cross_validation=True, verbose=False, system=False)']\n", - "['2020-07-31 08', '47', '34,937', 'INFO', 'Checking exceptions']\n", - "['2020-07-31 08', '47', '34,937', 'INFO', 'Preloading libraries']\n", - "['2020-07-31 08', '47', '34,937', 'INFO', 'Preparing display monitor']\n", - "['2020-07-31 08', '47', '34,953', 'INFO', 'Copying training dataset']\n", - "['2020-07-31 08', '47', '34,954', 'INFO', 'Importing libraries']\n", - "['2020-07-31 08', '47', '34,954', 'INFO', 'Defining folds']\n", - "['2020-07-31 08', '47', '34,954', 'INFO', 'Declaring metric variables']\n", - "['2020-07-31 08', '47', '34,955', 'INFO', 'Declaring custom model']\n", - "['2020-07-31 08', '47', '34,956', 'INFO', 'AdaBoost Regressor Imported succesfully']\n", - "['2020-07-31 08', '47', '34,957', 'INFO', 'Checking ensemble method']\n", - "['2020-07-31 08', '47', '34,958', 'INFO', 'Initializing Fold 1']\n", - "['2020-07-31 08', '47', '34,961', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,005', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,008', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,008', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,015', 'INFO', 'Initializing Fold 2']\n", - "['2020-07-31 08', '47', '35,016', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,074', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,078', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,079', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,088', 'INFO', 'Initializing Fold 3']\n", - "['2020-07-31 08', '47', '35,089', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,141', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,145', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,146', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,153', 'INFO', 'Initializing Fold 4']\n", - "['2020-07-31 08', '47', '35,154', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,201', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,204', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,204', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,211', 'INFO', 'Initializing Fold 5']\n", - "['2020-07-31 08', '47', '35,213', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,259', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,262', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,262', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,269', 'INFO', 'Initializing Fold 6']\n", - "['2020-07-31 08', '47', '35,270', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,312', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,316', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,316', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,322', 'INFO', 'Initializing Fold 7']\n", - "['2020-07-31 08', '47', '35,324', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,365', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,369', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,369', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,375', 'INFO', 'Initializing Fold 8']\n", - "['2020-07-31 08', '47', '35,376', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,417', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,420', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,420', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,426', 'INFO', 'Initializing Fold 9']\n", - "['2020-07-31 08', '47', '35,427', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,468', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,471', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,471', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,477', 'INFO', 'Initializing Fold 10']\n", - "['2020-07-31 08', '47', '35,478', 'INFO', 'Fitting Model']\n", - "['2020-07-31 08', '47', '35,518', 'INFO', 'Evaluating Metrics']\n", - "['2020-07-31 08', '47', '35,521', 'INFO', 'No inverse transformation']\n", - "['2020-07-31 08', '47', '35,521', 'INFO', 'Compiling Metrics']\n", - "['2020-07-31 08', '47', '35,527', 'INFO', 'Calculating mean and std']\n", - "['2020-07-31 08', '47', '35,528', 'INFO', 'Creating metrics dataframe']\n", - "['2020-07-31 08', '47', '35,532', 'INFO', 'Finalizing model']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'Uploading results into container']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'Uploading model into container']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'create_model_container', '23']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'master_model_container', '23']\n", - "['2020-07-31 08', '47', '35,575', 'INFO', 'display_container', '25']\n", - "['2020-07-31 08', '47', '35,576', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '47', '35,576', 'INFO', 'create_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '35,576', 'INFO', 'SubProcess create_model() end ==================================']\n", - "['2020-07-31 08', '47', '35,635', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '35,636', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '35,637', 'INFO', 'save_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), model_name=Trained Model, verbose=False)']\n", - "['2020-07-31 08', '47', '35,637', 'INFO', 'Appending prep pipeline']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['2020-07-31 08', '47', '35,647', 'INFO', 'Trained Model.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '35,653', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), None]']\n", - "['2020-07-31 08', '47', '35,653', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '35,653', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '35,712', 'INFO', 'create_model_container', '23']\n", - "['2020-07-31 08', '47', '35,712', 'INFO', 'master_model_container', '23']\n", - "['2020-07-31 08', '47', '35,712', 'INFO', 'display_container', '25']\n", - "['2020-07-31 08', '47', '35,713', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '47', '35,713', 'INFO', 'finalize_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '35,713', 'INFO', 'SubProcess finalize_model() end ==================================']\n", - "['2020-07-31 08', '47', '35,714', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '47', '35,715', 'INFO', 'automl() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '35,914', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '35,916', 'INFO', 'save_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), model_name=best-model, verbose=True)']\n", - "['2020-07-31 08', '47', '35,916', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '35,932', 'INFO', 'best-model.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '35,942', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), None]']\n", - "['2020-07-31 08', '47', '35,942', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '36,014', 'INFO', 'Initializing deploy_model()']\n", - "['2020-07-31 08', '47', '36,016', 'INFO', 'deploy_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "[\"random_state=123), model_name=best-aws, authentication={'bucket'\", \"'pycaret-test'}, platform=aws)\"]\n", - "['2020-07-31 08', '47', '36,019', 'INFO', 'Platform', 'AWS S3']\n", - "['2020-07-31 08', '47', '36,202', 'INFO', 'Saving model in active working directory']\n", - "['2020-07-31 08', '47', '36,202', 'INFO', 'SubProcess save_model() called ==================================']\n", - "['2020-07-31 08', '47', '36,203', 'INFO', 'Initializing save_model()']\n", - "['2020-07-31 08', '47', '36,204', 'INFO', 'save_model(model=AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), model_name=best-aws, verbose=False)']\n", - "['2020-07-31 08', '47', '36,204', 'INFO', 'Appending prep pipeline']\n", - "['2020-07-31 08', '47', '36,214', 'INFO', 'best-aws.pkl saved in current working directory']\n", - "['2020-07-31 08', '47', '36,220', 'INFO', '[Pipeline(memory=None,']\n", - "[\"steps=[('dtypes',\"]\n", - "['DataTypes_Auto_infer(categorical_features=[],']\n", - "['display_types=True, features_todrop=[],']\n", - "[\"ml_usecase='regression',\"]\n", - "[\"numerical_features=[], target='charges',\"]\n", - "['time_features=[])),']\n", - "[\"('imputer',\"]\n", - "[\"Simple_Imputer(categorical_strategy='not_available',\"]\n", - "[\"numeric_strategy='mean',\"]\n", - "['target_variable=None)),']\n", - "[\"('new_levels1',\"]\n", - "['New_Catagorical_Levels...']\n", - "[\"('group', Empty()), ('nonliner', Empty()), ('scaling', Empty()),\"]\n", - "[\"('P_transform', Empty()), ('pt_target', Empty()),\"]\n", - "[\"('binn', Empty()), ('rem_outliers', Empty()),\"]\n", - "[\"('cluster_all', Empty()), ('dummy', Dummify(target='charges')),\"]\n", - "[\"('fix_perfect', Empty()), ('clean_names', Clean_Colum_Names()),\"]\n", - "[\"('feature_select', Empty()), ('fix_multi', Empty()),\"]\n", - "[\"('dfs', Empty()), ('pca', Empty())],\"]\n", - "['verbose=False), AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123), None]']\n", - "['2020-07-31 08', '47', '36,220', 'INFO', 'save_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '36,220', 'INFO', 'SubProcess save_model() end ==================================']\n", - "['2020-07-31 08', '47', '36,220', 'INFO', 'Initializing S3 client']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'PyCaret Clustering Module']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'version 2.0']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'Initializing setup()']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'USI', '872d']\n", - "['2020-07-31 08', '47', '36,853', 'INFO', 'setup(data=(224, 21), categorical_features=None, categorical_imputation=constant, ordinal_features=None, high_cardinality_features=None,']\n", - "[\"numeric_features=None, numeric_imputation=mean, date_features=None, ignore_features=['Country Name'], normalize=False,\"]\n", - "['normalize_method=zscore, transformation=False, transformation_method=yeo-johnson, handle_unknown_categorical=True, unknown_categorical_method=least_frequent, pca=False, pca_method=linear,']\n", - "['pca_components=None, ignore_low_variance=False, combine_rare_levels=False, rare_level_threshold=0.1, bin_numeric_features=None,']\n", - "['remove_multicollinearity=False, multicollinearity_threshold=0.9, group_features=None,']\n", - "['group_names=None, supervised=False, supervised_target=None, n_jobs=-1, html=True, session_id=123, log_experiment=True,']\n", - "['experiment_name=health1, log_plots=True, log_profile=False, log_data=False, silent=False, verbose=True, profile=False)']\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'Checking environment']\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'python_version', '3.7.4']\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'python_build', \"('default', 'Aug 9 2019 18\", '34', \"13')\"]\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'machine', 'AMD64']\n", - "['2020-07-31 08', '47', '36,854', 'INFO', 'platform', 'Windows-10-10.0.18362-SP0']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'Memory', 'svmem(total=17032478720, available=10622828544, percent=37.6, used=6409650176, free=10622828544)']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'Physical Core', '4']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'Logical Core', '8']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'Checking libraries']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'pd==1.0.5']\n", - "['2020-07-31 08', '47', '36,864', 'INFO', 'numpy==1.18.5']\n", - "['2020-07-31 08', '47', '37,218', 'INFO', 'sklearn==0.23.1']\n", - "['2020-07-31 08', '47', '37,223', 'INFO', 'kmodes==0.10.1']\n", - "['2020-07-31 08', '47', '37,758', 'INFO', 'AdaBoostRegressor(base_estimator=DecisionTreeRegressor(ccp_alpha=0.0,']\n", - "[\"criterion='mse',\"]\n", - "['max_depth=None,']\n", - "['max_features=None,']\n", - "['max_leaf_nodes=None,']\n", - "['min_impurity_decrease=0.0,']\n", - "['min_impurity_split=None,']\n", - "['min_samples_leaf=1,']\n", - "['min_samples_split=2,']\n", - "['min_weight_fraction_leaf=0.0,']\n", - "[\"presort='deprecated',\"]\n", - "['random_state=123,']\n", - "[\"splitter='best'),\"]\n", - "[\"learning_rate=1.0, loss='linear', n_estimators=10,\"]\n", - "['random_state=123)']\n", - "['2020-07-31 08', '47', '37,758', 'INFO', 'deploy_model() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '37,765', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '47', '37,765', 'INFO', 'get_config(variable=X_train)']\n", - "['2020-07-31 08', '47', '37,765', 'INFO', 'Global variable', 'X_train returned']\n", - "['2020-07-31 08', '47', '37,765', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '37,788', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '47', '37,788', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 08', '47', '37,788', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 08', '47', '37,788', 'INFO', 'get_config() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '37,795', 'INFO', 'Initializing set_config()']\n", - "['2020-07-31 08', '47', '37,795', 'INFO', 'set_config(variable=seed, value=999)']\n", - "['2020-07-31 08', '47', '37,795', 'INFO', 'Global variable', 'seed updated']\n", - "['2020-07-31 08', '47', '37,796', 'INFO', 'set_config() succesfully completed......................................']\n", - "['2020-07-31 08', '47', '37,801', 'INFO', 'Initializing get_config()']\n", - "['2020-07-31 08', '47', '37,801', 'INFO', 'get_config(variable=seed)']\n", - "['2020-07-31 08', '47', '37,801', 'INFO', 'Global variable', 'seed returned']\n", - "['2020-07-31 08', '47', '37,801', 'INFO', 'get_config() succesfully completed......................................']\n" - ] - } - ], - "source": [ - "get_system_logs()" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "# 17. MLFlow UI" + "# 16. MLFlow UI" ] }, {