add specification for imputer method

chuangw6 · chuangw6 · commit 0894aca2f442 · 2021-02-27T19:30:12.000-08:00
diff --git a/eda_utils_py/eda_utils_py.py b/eda_utils_py/eda_utils_py.py
@@ -1,3 +1,27 @@
+def imputer(dataframe, strategy="mean", fill_value=None):
+    """
+    Impute (fill in) the missing values of a dataframe.
+
+    Parameters
+    ----------
+    dataframe : pandas.DataFrame
+        A dataframe that might contain missing data.
+    strategy : string, default="mean"
+        The imputation strategy.
+        - If "mean", then replace missing values using the mean along each column. Can only be used with numeric data.
+        - If "median", then replace missing values using the median along each column. Can only be used with numeric data.
+        - If "most_frequent", then replace missing values using the most frequent value along each column. Can be used with strings or numeric data. If there is more than one such value, only the smallest is used.
+        - If "constant", then replace missing values with fill_value. Can be used with strings or numeric data.
+    fill_value : string or numerical value, default=None
+        When strategy == "constant", fill_value is used to replace all occurrences of missing values. If left to the default, fill_value will be 0 when imputing numerical data and "missing_value" for strings or object data types.
+
+    Returns
+    -------
+    pandas.DataFrame
+        A dataframe that contains no missing data.
+    """
+    
+
 def cor_map(dataframe, num_col):
     """
     A function to implement a correlation heatmap including coefficients based on given numeric columns of a data frame.