import pytest
from pyspark.mllib.evaluation import BinaryClassificationMetrics

+from data_preprocessor import DataPreprocessor
from model_evaluator import ModelEvaluator
from models_container import ModelsContainer, ModelKinds

@@ -28,17 +29,30 @@ def test_model_evaluator_with_linear_regression_and_full_train_data(logistic_mod
def test_several_classification_models_fitting(preprocessor_train_data):
-    preprocessor_train_data.prepare_to_model(target_col='income', to_strip=' .')
-    evaluator = ModelEvaluator(metrics_class=BinaryClassificationMetrics)
+    df = preprocessor_train_data.train_df.sample(0.1)
+    preprocessor = DataPreprocessor(train_df=df, test_df=df)
+    preprocessor.prepare_to_model(target_col='income', to_strip=' .')
+
    models = ModelsContainer()
-    models.fit(preprocessor_train_data.train_encoded_df, kind=ModelKinds.CLASSIFICATION)
-    evaluator.compare({"train": preprocessor_train_data.train_encoded_df}, models=models.fitted_models)
-    print('kk')
+    models.fit(preprocessor.train_encoded_df, kind=ModelKinds.CLASSIFICATION)
+    expected_results = [
+        {"model": models.logistic_class.fitted_model,
+         "metrics": {"areaUnderROC": 0.770414, "areaUnderPR": 0.646093}},
+        {"model": models.random_forest_class.fitted_model,
+         "metrics": {"areaUnderROC": 0.674751, "areaUnderPR": 0.664931}},
+        {"model": models.gbt_class.fitted_model,
+         "metrics": {"areaUnderROC": 0.811643, "areaUnderPR": 0.746147}},
+        {"model": models.svm_class.fitted_model,
+         "metrics": {"areaUnderROC": 0.750627, "areaUnderPR": 0.645328}},
+        {"model": models.naive_bayes_class.fitted_model,
+         "metrics": {"areaUnderROC": 0.615000, "areaUnderPR": 0.504709}},
+    ]
+    for result in expected_results:
+        _check_evaluation(preprocessor=preprocessor, model=result["model"], metrics=result["metrics"])


def _check_evaluation(preprocessor, model, metrics: Dict[str, float]):
-    metrics_class = BinaryClassificationMetrics
-    evaluator = ModelEvaluator(metrics_class=metrics_class)
+    evaluator = ModelEvaluator(metrics_class=BinaryClassificationMetrics)
    # The purpose of this parameter is to prove names can be arbitrary in the compare method
    dataframes_sets = [['train', 'test'], ['train1', 'test1']]
    for dataframes in dataframes_sets:
@@ -51,4 +65,5 @@ def _check_evaluation(preprocessor, model, metrics: Dict[str, float]):
        for metric in metrics:
            assert metric in comparison
            for dataframe in dataframes:
-                assert comparison[metric][evaluator.index_key(dataframe, model)] == pytest.approx(metrics[metric])
+                assert comparison[metric][evaluator.index_key(dataframe, model)] == pytest.approx(metrics[metric],
+                                                                                                  abs=0.035)
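Note on the assertions above: ModelEvaluator.compare and index_key are project-local helpers, and the shape of the comparison they produce is only inferred from this test, not from documented API. A minimal sketch of the assumed usage follows; the dataframe name "train" and the choice of logistic_class as the inspected model are illustrative:

    evaluator = ModelEvaluator(metrics_class=BinaryClassificationMetrics)
    # Assumed shape: compare() accepts arbitrarily named dataframes plus fitted models and
    # returns a mapping of metric name -> {index_key(dataframe_name, model): value}.
    comparison = evaluator.compare({"train": preprocessor.train_encoded_df}, models=models.fitted_models)
    roc = comparison["areaUnderROC"][evaluator.index_key("train", models.logistic_class.fitted_model)]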