Autoformat tests

fatse · fatse · commit 3a34a14b4dba · 2021-03-06T08:42:21.000-08:00
diff --git a/tests/test_eda_utils_py.py b/tests/test_eda_utils_py.py
@@ -6,7 +6,6 @@
 import numpy as np
 
 
-
 def test_version():
     assert __version__ == "0.1.0"
 
@@ -188,8 +187,10 @@ def test_scaler():
     )
 
     mock_df_1_standard = pd.DataFrame(
-        {"col1": [-0.3302891295379082, -0.8807710121010884, -0.8807710121010884, 0.7706746355884523, 1.3211565181516325],
-         "col2": [1.714389230829046, -0.26375218935831474, -0.26375218935831474, -0.9231326627541017, -0.26375218935831474],
+        {"col1": [-0.3302891295379082, -0.8807710121010884, -0.8807710121010884, 0.7706746355884523,
+                  1.3211565181516325],
+         "col2": [1.714389230829046, -0.26375218935831474, -0.26375218935831474, -0.9231326627541017,
+                  -0.26375218935831474],
          "col3": [1.0, -1.0, -1.0, 1.0, 0.0]}
     )
 
@@ -233,7 +234,6 @@ def test_scaler():
         minmax_scaled_mock_df_1, mock_df_1_minmax
     ), "The returned dataframe using standard scaler method is not correct"
 
-
     assert pd.DataFrame.equals(
         standard_scaled_mock_df_2, mock_df_2_standard
     ), "The returned dataframe using most_frequent inputer is not correct"
@@ -242,43 +242,47 @@ def test_scaler():
     ), "The returned dataframe using constant imputer is not correct"
 
 
-
 def test_outlier_identifier():
     test_df = pd.DataFrame({
         'SepalLengthCm': [5.1, 4.9, 4.7, 5.5, 5.1, 50, 5.4, 5.0, 5.2, 5.3, 5.1],
         'SepalWidthCm': [1.4, 1.4, 20, 2.0, 0.7, 1.6, 1.2, 1.4, 1.8, 1.5, 2.1],
-        'PetalWidthCm' :[0.2, 0.2, 0.2, 0.3, 0.4, 0.5, 0.5, 0.6, 0.4, 0.2, 5],
-        'Species':['Iris-setosa', 'Iris-virginica', 'Iris-germanica', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa']
+        'PetalWidthCm': [0.2, 0.2, 0.2, 0.3, 0.4, 0.5, 0.5, 0.6, 0.4, 0.2, 5],
+        'Species': ['Iris-setosa', 'Iris-virginica', 'Iris-germanica', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa',
+                    'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa']
     })
 
     test_column = ['SepalLengthCm', 'SepalWidthCm', 'PetalWidthCm']
 
     median_output = pd.DataFrame({
         'SepalLengthCm': [5.1, 4.9, 4.7, 5.5, 5.1, 5.1, 5.4, 5.0, 5.2, 5.3, 5.1],
         'SepalWidthCm': [1.4, 1.4, 1.5, 2.0, 0.7, 1.6, 1.2, 1.4, 1.8, 1.5, 2.1],
-        'PetalWidthCm' :[0.2, 0.2, 0.2, 0.3, 0.4, 0.5, 0.5, 0.6, 0.4, 0.2, 0.4],
-    'Species':['Iris-setosa', 'Iris-virginica', 'Iris-germanica', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa']
+        'PetalWidthCm': [0.2, 0.2, 0.2, 0.3, 0.4, 0.5, 0.5, 0.6, 0.4, 0.2, 0.4],
+        'Species': ['Iris-setosa', 'Iris-virginica', 'Iris-germanica', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa',
+                    'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa']
     })
 
     trim_output = pd.DataFrame({
         'SepalLengthCm': [5.1, 4.9, 5.5, 5.1, 5.4, 5.0, 5.2, 5.3],
         'SepalWidthCm': [1.4, 1.4, 2.0, 0.7, 1.2, 1.4, 1.8, 1.5],
-        'PetalWidthCm' :[0.2, 0.2, 0.3, 0.4, 0.5, 0.6, 0.4, 0.2],
-        'Species':['Iris-setosa', 'Iris-virginica', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa']
+        'PetalWidthCm': [0.2, 0.2, 0.3, 0.4, 0.5, 0.6, 0.4, 0.2],
+        'Species': ['Iris-setosa', 'Iris-virginica', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa',
+                    'Iris-setosa', 'Iris-setosa']
     })
 
     mean_output = pd.DataFrame({
         'SepalLengthCm': [5.1, 4.9, 4.7, 5.5, 5.1, 9.21, 5.4, 5.0, 5.2, 5.3, 5.1],
         'SepalWidthCm': [1.4, 1.4, 3.19, 2.0, 0.7, 1.6, 1.2, 1.4, 1.8, 1.5, 2.1],
-        'PetalWidthCm' :[0.2, 0.2, 0.2, 0.3, 0.4, 0.5, 0.5, 0.6, 0.4, 0.2, 0.77],
-        'Species':['Iris-setosa', 'Iris-virginica', 'Iris-germanica', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa']
+        'PetalWidthCm': [0.2, 0.2, 0.2, 0.3, 0.4, 0.5, 0.5, 0.6, 0.4, 0.2, 0.77],
+        'Species': ['Iris-setosa', 'Iris-virginica', 'Iris-germanica', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa',
+                    'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa']
     })
 
-    column_output= pd.DataFrame({
+    column_output = pd.DataFrame({
         'SepalLengthCm': [5.1, 4.9, 4.7, 5.5, 5.1, 9.21, 5.4, 5.0, 5.2, 5.3, 5.1],
         'SepalWidthCm': [1.4, 1.4, 20, 2.0, 0.7, 1.6, 1.2, 1.4, 1.8, 1.5, 2.1],
-        'PetalWidthCm' :[0.2, 0.2, 0.2, 0.3, 0.4, 0.5, 0.5, 0.6, 0.4, 0.2, 5],
-        'Species':['Iris-setosa', 'Iris-virginica', 'Iris-germanica', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa']
+        'PetalWidthCm': [0.2, 0.2, 0.2, 0.3, 0.4, 0.5, 0.5, 0.6, 0.4, 0.2, 5],
+        'Species': ['Iris-setosa', 'Iris-virginica', 'Iris-germanica', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa',
+                    'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa', 'Iris-setosa']
     })
 
     # Test if the imput is not dataFrame
@@ -295,7 +299,7 @@ def test_outlier_identifier():
 
     # Test if method input is not one of three methods provided
     with raises(Exception):
-        eda_utils_py.outlier_identifier(test_df, columns=["SepalLengthCm"], method = "no")
+        eda_utils_py.outlier_identifier(test_df, columns=["SepalLengthCm"], method="no")
 
     # Test if column selected included non-numeric columns
     with raises(Exception):
@@ -305,12 +309,11 @@ def test_outlier_identifier():
         eda_utils_py.outlier_identifier(test_df, test_column), trim_output
     ), "Default test not pass"
     assert pd.DataFrame.equals(
-        eda_utils_py.outlier_identifier(test_df, test_column,method = "median"), median_output
+        eda_utils_py.outlier_identifier(test_df, test_column, method="median"), median_output
     ), "The median method is not correct"
     assert pd.DataFrame.equals(
-        eda_utils_py.outlier_identifier(test_df, test_column, method = "mean"), mean_output
+        eda_utils_py.outlier_identifier(test_df, test_column, method="mean"), mean_output
     ), "The mean method is not correct"
     assert pd.DataFrame.equals(
-        eda_utils_py.outlier_identifier(test_df, columns = ["SepalLengthCm"], method = "mean"), column_output
+        eda_utils_py.outlier_identifier(test_df, columns=["SepalLengthCm"], method="mean"), column_output
     ), "The selected column method is not correct"
-