From 393052b17fdb9f63a9e428da0039b76237d7607c Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Sun, 27 Dec 2020 22:48:32 -0500 Subject: [PATCH 01/98] init --- evalml/pipelines/components/estimators/estimator.py | 6 ++---- evalml/pipelines/components/transformers/transformer.py | 9 +++++---- 2 files changed, 7 insertions(+), 8 deletions(-) diff --git a/evalml/pipelines/components/estimators/estimator.py b/evalml/pipelines/components/estimators/estimator.py index 1ad9e98455..840dbe7f83 100644 --- a/evalml/pipelines/components/estimators/estimator.py +++ b/evalml/pipelines/components/estimators/estimator.py @@ -43,8 +43,7 @@ def predict(self, X): predictions = self._component_obj.predict(X) except AttributeError: raise MethodPropertyNotFoundError("Estimator requires a predict method or a component_obj that implements predict") - if not isinstance(predictions, pd.Series): - predictions = pd.Series(predictions) + predictions = _convert_to_woodwork_structure(predictions) return predictions def predict_proba(self, X): @@ -62,8 +61,7 @@ def predict_proba(self, X): pred_proba = self._component_obj.predict_proba(X) except AttributeError: raise MethodPropertyNotFoundError("Estimator requires a predict_proba method or a component_obj that implements predict_proba") - if not isinstance(pred_proba, pd.DataFrame): - pred_proba = pd.DataFrame(pred_proba) + pred_proba = _convert_to_woodwork_structure(pred_proba) return pred_proba @property diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index 51d2c7a4dd..4727e34882 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -4,6 +4,7 @@ from evalml.model_family import ModelFamily from evalml.pipelines.components import ComponentBase +from evalml.utils.gen_utils import _convert_to_woodwork_structure class Transformer(ComponentBase): """A component that may or may not need fitting that transforms data. @@ -34,8 +35,8 @@ def transform(self, X, y=None): except AttributeError: raise MethodPropertyNotFoundError("Transformer requires a transform method or a component_obj that implements transform") if not isinstance(X_t, pd.DataFrame) and isinstance(X, pd.DataFrame): - return pd.DataFrame(X_t, columns=X.columns, index=X.index) - return pd.DataFrame(X_t) + return _convert_to_woodwork_structure(pd.DataFrame(X_t, columns=X.columns, index=X.index)) + return _convert_to_woodwork_structure(X_t) def fit_transform(self, X, y=None): """Fits on X and transforms X @@ -56,5 +57,5 @@ def fit_transform(self, X, y=None): raise e if not isinstance(X_t, pd.DataFrame) and isinstance(X, pd.DataFrame): - return pd.DataFrame(X_t, columns=X.columns, index=X.index) - return pd.DataFrame(X_t) + return _convert_to_woodwork_structure(pd.DataFrame(X_t, columns=X.columns, index=X.index)) + return _convert_to_woodwork_structure(X_t) From 2746e74e26c64a1dd84a05deb3b9d49ace854dd3 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 7 Jan 2021 21:06:35 -0500 Subject: [PATCH 02/98] updated imputer init, starting to update tests... 
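[Editor's context for patch 01: it threads `_convert_to_woodwork_structure` through `Estimator.predict`/`predict_proba` and `Transformer.transform`, but the helper itself never appears in these diffs. A minimal sketch of what such a helper might look like, assuming the pre-0.1 Woodwork API (`ww.DataTable`/`ww.DataColumn`) that the `.to_dataframe()` calls later in the series imply; the real helper lives in `evalml.utils.gen_utils` and may differ.]

    import numpy as np
    import pandas as pd
    import woodwork as ww

    def _convert_to_woodwork_structure(data):
        """Hypothetical sketch: pass Woodwork structures through, wrap everything else."""
        if isinstance(data, (ww.DataTable, ww.DataColumn)):
            return data
        if isinstance(data, pd.Series):
            return ww.DataColumn(data)
        if isinstance(data, pd.DataFrame):
            return ww.DataTable(data)
        data = np.asarray(data)
        if data.ndim == 1:
            # 1-D input (list, 1-D ndarray) becomes a DataColumn
            return ww.DataColumn(pd.Series(data))
        # 2-D input becomes a DataTable
        return ww.DataTable(pd.DataFrame(data))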
--- .../transformers/imputers/imputer.py | 3 +- .../transformers/imputers/simple_imputer.py | 6 ++- evalml/tests/component_tests/test_imputer.py | 46 +++++++++---------- .../component_tests/test_simple_imputer.py | 44 +++++++++--------- 4 files changed, 52 insertions(+), 47 deletions(-) diff --git a/evalml/pipelines/components/transformers/imputers/imputer.py b/evalml/pipelines/components/transformers/imputers/imputer.py index b801c942bd..ed4d6fa776 100644 --- a/evalml/pipelines/components/transformers/imputers/imputer.py +++ b/evalml/pipelines/components/transformers/imputers/imputer.py @@ -101,6 +101,7 @@ def transform(self, X, y=None): X_null_dropped = X.copy() X_null_dropped.drop(self._all_null_cols, inplace=True, axis=1, errors='ignore') if X_null_dropped.empty: + X_null_dropped = _convert_to_woodwork_structure(X_null_dropped) return X_null_dropped if self._numeric_cols is not None and len(self._numeric_cols) > 0: @@ -114,5 +115,5 @@ def transform(self, X, y=None): imputed = self._categorical_imputer.transform(X_categorical) imputed.index = X_null_dropped.index X_null_dropped[X_categorical.columns] = imputed - + X_null_dropped = _convert_to_woodwork_structure(X_null_dropped) return X_null_dropped diff --git a/evalml/pipelines/components/transformers/imputers/simple_imputer.py b/evalml/pipelines/components/transformers/imputers/simple_imputer.py index 24751d7af9..82fb641ac4 100644 --- a/evalml/pipelines/components/transformers/imputers/simple_imputer.py +++ b/evalml/pipelines/components/transformers/imputers/simple_imputer.py @@ -77,16 +77,20 @@ def transform(self, X, y=None): # Return early since bool dtype doesn't support nans and sklearn errors if all cols are bool if (X.dtypes == bool).all(): + X = _convert_to_woodwork_structure(X) return X X_null_dropped = X.copy() X_null_dropped.drop(self._all_null_cols, axis=1, errors='ignore', inplace=True) category_cols = X_null_dropped.select_dtypes(include=['category']).columns X_t = self._component_obj.transform(X) if X_null_dropped.empty: - return pd.DataFrame(X_t, columns=X_null_dropped.columns) + X_t = pd.DataFrame(X_t, columns=X_null_dropped.columns) + X_t = _convert_to_woodwork_structure(X_t) + return X_t X_t = pd.DataFrame(X_t, columns=X_null_dropped.columns) if len(category_cols) > 0: X_t[category_cols] = X_t[category_cols].astype('category') + X_t = _convert_to_woodwork_structure(X_t) return X_t def fit_transform(self, X, y=None): diff --git a/evalml/tests/component_tests/test_imputer.py b/evalml/tests/component_tests/test_imputer.py index 74dabaa138..d660fb00c6 100644 --- a/evalml/tests/component_tests/test_imputer.py +++ b/evalml/tests/component_tests/test_imputer.py @@ -79,11 +79,11 @@ def test_numeric_only_input(imputer_test_data): "int with nan": [0.5, 1.0, 0.0, 0.0, 1.0], "float with nan": [0.0, 1.0, 0, -1.0, 0.] 
}) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) imputer = Imputer() transformed = imputer.fit_transform(X, y) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) def test_categorical_only_input(imputer_test_data): @@ -105,7 +105,7 @@ def test_categorical_only_input(imputer_test_data): imputer = Imputer() transformed = imputer.fit_transform(X, y) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) def test_categorical_and_numeric_input(imputer_test_data): @@ -126,11 +126,11 @@ def test_categorical_and_numeric_input(imputer_test_data): "object with nan": pd.Series(["b", "b", "b", "c", "b"], dtype='category'), "bool col with nan": [True, True, False, True, True] }) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) imputer = Imputer() transformed = imputer.fit_transform(X, y) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) def test_drop_all_columns(imputer_test_data): @@ -140,11 +140,11 @@ def test_drop_all_columns(imputer_test_data): imputer.fit(X, y) transformed = imputer.transform(X, y) expected = X.drop(["all nan cat", "all nan"], axis=1) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) imputer = Imputer() transformed = imputer.fit_transform(X, y) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) def test_typed_imputer_numpy_input(): @@ -158,11 +158,11 @@ def test_typed_imputer_numpy_input(): expected = pd.DataFrame(np.array([[1, 2, 2, 0], [1, 0, 0, 0], [1, 1, 1, 0]])) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) imputer = Imputer() transformed = imputer.fit_transform(X, y) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) def test_imputer_datetime_input(): @@ -175,11 +175,11 @@ def test_imputer_datetime_input(): imputer = Imputer() imputer.fit(X, y) transformed = imputer.transform(X, y) - assert_frame_equal(transformed, X, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), X, check_dtype=False) imputer = Imputer() transformed = imputer.fit_transform(X, y) - assert_frame_equal(transformed, X, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), X, check_dtype=False) @pytest.mark.parametrize("data_type", ['np', 'pd', 'ww']) @@ -199,11 +199,11 @@ def test_imputer_empty_data(data_type): imputer = Imputer() imputer.fit(X, y) transformed = imputer.transform(X, y) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) imputer = Imputer() transformed = imputer.fit_transform(X, y) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) def test_imputer_does_not_reset_index(): @@ -219,7 +219,7 @@ def test_imputer_does_not_reset_index(): imputer = Imputer() imputer.fit(X, y=y) transformed 
= imputer.transform(X) - pd.testing.assert_frame_equal(transformed, + pd.testing.assert_frame_equal(transformed.to_dataframe(), pd.DataFrame({'input_val': [1.0, 2, 3, 4, 5, 6, 7, 8, 9], 'input_cat': pd.Categorical(['a'] * 6 + ['b'] * 3)}, index=list(range(1, 10)))) @@ -240,12 +240,12 @@ def test_imputer_fill_value(imputer_test_data): "object with nan": pd.Series(["b", "b", "fill", "c", "fill"], dtype='category'), "bool col with nan": [True, "fill", False, "fill", True] }) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) imputer = Imputer(categorical_impute_strategy="constant", numeric_impute_strategy="constant", categorical_fill_value="fill", numeric_fill_value=-1) transformed = imputer.fit_transform(X, y) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) def test_imputer_no_nans(imputer_test_data): @@ -260,12 +260,12 @@ def test_imputer_no_nans(imputer_test_data): "object col": pd.Series(["b", "b", "a", "c", "d"], dtype='category'), "bool col": [True, False, False, True, True], }) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) imputer = Imputer(categorical_impute_strategy="constant", numeric_impute_strategy="constant", categorical_fill_value="fill", numeric_fill_value=-1) transformed = imputer.fit_transform(X, y) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) def test_imputer_with_none(): @@ -284,11 +284,11 @@ def test_imputer_with_none(): "category with None": pd.Series(["b", "a", "a", "a"], dtype='category'), "boolean with None": [True, True, False, True], "object with None": pd.Series(["b", "a", "a", "a"], dtype='category')}) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) imputer = Imputer() transformed = imputer.fit_transform(X, y) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) @pytest.mark.parametrize("data_type", ['pd', 'ww']) @@ -302,7 +302,7 @@ def test_imputer_all_bool_return_original(data_type): imputer = Imputer() imputer.fit(X, y) X_t = imputer.transform(X) - assert_frame_equal(X_expected_arr, X_t) + assert_frame_equal(X_expected_arr, X_t.to_dataframe()) @pytest.mark.parametrize("data_type", ['pd', 'ww']) @@ -315,7 +315,7 @@ def test_imputer_bool_dtype_object(data_type, make_data_type): imputer = Imputer() imputer.fit(X, y) X_t = imputer.transform(X) - assert_frame_equal(X_expected_arr, X_t) + assert_frame_equal(X_expected_arr, X_t.to_dataframe()) @pytest.mark.parametrize("data_type", ['pd', 'ww']) @@ -335,4 +335,4 @@ def test_imputer_multitype_with_one_bool(data_type): imputer = Imputer() imputer.fit(X_multi, y) X_multi_t = imputer.transform(X_multi) - assert_frame_equal(X_multi_expected_arr, X_multi_t) + assert_frame_equal(X_multi_expected_arr, X_multi_t.to_dataframe()) diff --git a/evalml/tests/component_tests/test_simple_imputer.py b/evalml/tests/component_tests/test_simple_imputer.py index 43843ec1ba..7cc3d398cd 100644 --- a/evalml/tests/component_tests/test_simple_imputer.py +++ b/evalml/tests/component_tests/test_simple_imputer.py @@ -20,7 +20,7 @@ def test_simple_imputer_median(): [10, 2, 5, 2], [6, 2, 7, 0]]) X_t = 
transformer.fit_transform(X) - assert_frame_equal(X_expected_arr, X_t, check_dtype=False) + assert_frame_equal(X_expected_arr, X_t.to_dataframe(), check_dtype=False) def test_simple_imputer_mean(): @@ -33,7 +33,7 @@ def test_simple_imputer_mean(): [1, 2, 3, 2], [1, 2, 3, 0]]) X_t = transformer.fit_transform(X) - assert_frame_equal(X_expected_arr, X_t, check_dtype=False) + assert_frame_equal(X_expected_arr, X_t.to_dataframe(), check_dtype=False) def test_simple_imputer_constant(): @@ -48,7 +48,7 @@ def test_simple_imputer_constant(): ["b", 2, 3, 0]]) X_expected_arr = X_expected_arr.astype({0: 'category'}) X_t = transformer.fit_transform(X) - assert_frame_equal(X_expected_arr, X_t, check_dtype=False) + assert_frame_equal(X_expected_arr, X_t.to_dataframe(), check_dtype=False) def test_simple_imputer_most_frequent(): @@ -62,7 +62,7 @@ def test_simple_imputer_most_frequent(): ["b", 2, 1, 0]]) X_expected_arr = X_expected_arr.astype({0: 'category'}) X_t = transformer.fit_transform(X) - assert_frame_equal(X_expected_arr, X_t, check_dtype=False) + assert_frame_equal(X_expected_arr, X_t.to_dataframe(), check_dtype=False) def test_simple_imputer_col_with_non_numeric(): @@ -91,7 +91,7 @@ def test_simple_imputer_col_with_non_numeric(): ["a", 2, 3, 0]]) X_expected_arr = X_expected_arr.astype({0: 'category'}) X_t = transformer.fit_transform(X) - assert_frame_equal(X_expected_arr, X_t, check_dtype=False) + assert_frame_equal(X_expected_arr, X_t.to_dataframe(), check_dtype=False) transformer = SimpleImputer(impute_strategy='constant', fill_value=2) X_expected_arr = pd.DataFrame([["a", 0, 1, 2], @@ -100,7 +100,7 @@ def test_simple_imputer_col_with_non_numeric(): [2, 2, 3, 0]]) X_expected_arr = X_expected_arr.astype({0: 'category'}) X_t = transformer.fit_transform(X) - assert_frame_equal(X_expected_arr, X_t, check_dtype=False) + assert_frame_equal(X_expected_arr, X_t.to_dataframe(), check_dtype=False) @pytest.mark.parametrize("data_type", ['pd', 'ww']) @@ -113,20 +113,20 @@ def test_simple_imputer_all_bool_return_original(data_type, make_data_type): imputer = SimpleImputer() imputer.fit(X, y) X_t = imputer.transform(X) - assert_frame_equal(X_expected_arr, X_t) + assert_frame_equal(X_expected_arr, X_t.to_dataframe()) @pytest.mark.parametrize("data_type", ['pd', 'ww']) def test_simple_imputer_bool_dtype_object(data_type): X = pd.DataFrame([True, np.nan, False, np.nan, True], dtype=object) y = pd.Series([1, 0, 0, 1, 0]) - X_expected_arr = pd.DataFrame([True, True, False, True, True], dtype='category') + X_expected_arr = pd.DataFrame([True, True, False, True, True], dtype='boolean') if data_type == 'ww': X = ww.DataTable(X) imputer = SimpleImputer() imputer.fit(X, y) X_t = imputer.transform(X) - assert_frame_equal(X_expected_arr, X_t) + assert_frame_equal(X_expected_arr, X_t.to_dataframe()) @pytest.mark.parametrize("data_type", ['pd', 'ww']) @@ -145,7 +145,7 @@ def test_simple_imputer_multitype_with_one_bool(data_type): imputer = SimpleImputer() imputer.fit(X_multi, y) X_multi_t = imputer.transform(X_multi) - assert_frame_equal(X_multi_expected_arr, X_multi_t) + assert_frame_equal(X_multi_expected_arr, X_multi_t.to_dataframe()) def test_simple_imputer_fit_transform_drop_all_nan_columns(): @@ -156,7 +156,7 @@ def test_simple_imputer_fit_transform_drop_all_nan_columns(): transformer = SimpleImputer(impute_strategy='most_frequent') X_expected_arr = pd.DataFrame({"some_nan": [0, 1, 0], "another_col": [0, 1, 2]}) X_t = transformer.fit_transform(X) - assert_frame_equal(X_expected_arr, X_t, check_dtype=False) + 
assert_frame_equal(X_expected_arr, X_t.to_dataframe(), check_dtype=False) assert_frame_equal(X, pd.DataFrame({"all_nan": [np.nan, np.nan, np.nan], "some_nan": [np.nan, 1, 0], "another_col": [0, 1, 2]})) @@ -169,7 +169,7 @@ def test_simple_imputer_transform_drop_all_nan_columns(): transformer = SimpleImputer(impute_strategy='most_frequent') transformer.fit(X) X_expected_arr = pd.DataFrame({"some_nan": [0, 1, 0], "another_col": [0, 1, 2]}) - assert_frame_equal(X_expected_arr, transformer.transform(X), check_dtype=False) + assert_frame_equal(X_expected_arr, transformer.transform(X).to_dataframe(), check_dtype=False) assert_frame_equal(X, pd.DataFrame({"all_nan": [np.nan, np.nan, np.nan], "some_nan": [np.nan, 1, 0], "another_col": [0, 1, 2]})) @@ -178,12 +178,12 @@ def test_simple_imputer_transform_drop_all_nan_columns(): def test_simple_imputer_transform_drop_all_nan_columns_empty(): X = pd.DataFrame([[np.nan, np.nan, np.nan]]) transformer = SimpleImputer(impute_strategy='most_frequent') - assert transformer.fit_transform(X).empty + assert transformer.fit_transform(X).to_dataframe().empty assert_frame_equal(X, pd.DataFrame([[np.nan, np.nan, np.nan]])) transformer = SimpleImputer(impute_strategy='most_frequent') transformer.fit(X) - assert transformer.transform(X).empty + assert transformer.transform(X).to_dataframe().empty assert_frame_equal(X, pd.DataFrame([[np.nan, np.nan, np.nan]])) @@ -195,7 +195,7 @@ def test_simple_imputer_numpy_input(): X_expected_arr = np.array([[0, 1, 1], [2, 3, 2], [2, 3, 0]]) - assert np.allclose(X_expected_arr, transformer.fit_transform(X)) + assert np.allclose(X_expected_arr, transformer.fit_transform(X).to_dataframe()) np.testing.assert_almost_equal(X, np.array([[np.nan, 0, 1, np.nan], [np.nan, 2, 3, 2], [np.nan, 2, 3, 0]])) @@ -227,11 +227,11 @@ def test_simple_imputer_fill_value(data_type): imputer = SimpleImputer(impute_strategy="constant", fill_value=fill_value) imputer.fit(X, y) transformed = imputer.transform(X, y) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(expected, transformed.to_dataframe(), check_dtype=False) imputer = SimpleImputer(impute_strategy="constant", fill_value=fill_value) transformed = imputer.fit_transform(X, y) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(expected, transformed.to_dataframe(), check_dtype=False) def test_simple_imputer_resets_index(): @@ -249,10 +249,10 @@ def test_simple_imputer_resets_index(): imputer = SimpleImputer(impute_strategy="mean") imputer.fit(X, y=y) transformed = imputer.transform(X) - pd.testing.assert_frame_equal(transformed, - pd.DataFrame({'input_val': [1.0, 2, 3, 4, 5, 6, 7, 8, 9]}, + pd.testing.assert_frame_equal(pd.DataFrame({'input_val': [1.0, 2, 3, 4, 5, 6, 7, 8, 9]}, dtype=float, - index=list(range(0, 9)))) + index=list(range(0, 9))), + transformed.to_dataframe()) def test_simple_imputer_with_none(): @@ -265,7 +265,7 @@ def test_simple_imputer_with_none(): transformed = imputer.transform(X, y) expected = pd.DataFrame({"int with None": [1, 0, 5, 2], "float with None": [0.1, 0.0, 0.5, 0.2]}) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(expected, transformed.to_dataframe(), check_dtype=False) X = pd.DataFrame({"category with None": pd.Series(["b", "a", "a", None], dtype='category'), "boolean with None": [True, None, False, True], @@ -278,4 +278,4 @@ def test_simple_imputer_with_none(): expected = pd.DataFrame({"category with None": pd.Series(["b", "a", "a", "a"], dtype='category'), 
"boolean with None": pd.Series([True, True, False, True], dtype='category'), "object with None": pd.Series(["b", "a", "a", "a"], dtype='category')}) - assert_frame_equal(transformed, expected, check_dtype=False) + assert_frame_equal(expected, transformed.to_dataframe(), check_dtype=False) From 1aee7f4c58d5e40cc6318b95ebbf8ea259c5a4c8 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 8 Jan 2021 15:18:05 -0500 Subject: [PATCH 03/98] what a mess! messing around with simpleimputer logic and type inference --- docs/source/release_notes.rst | 2 ++ .../components/transformers/imputers/simple_imputer.py | 9 ++++----- evalml/tests/component_tests/test_simple_imputer.py | 6 +++--- 3 files changed, 9 insertions(+), 8 deletions(-) diff --git a/docs/source/release_notes.rst b/docs/source/release_notes.rst index e5b4984c9c..1434f270ca 100644 --- a/docs/source/release_notes.rst +++ b/docs/source/release_notes.rst @@ -26,6 +26,7 @@ Release Notes * Changes * Added labeling to ``graph_confusion_matrix`` :pr:`1632` * Rerunning search for ``AutoMLSearch`` results in a message thrown rather than failing the search, and removed ``has_searched`` property :pr:`1647` + * Updated components and pipelines to return ``Woodwork`` data structures :pr:`1668` * Documentation Changes * Updated docs to include information about ``AutoMLSearch`` callback parameters and methods :pr:`1577` * Updated docs to prompt users to install graphiz on Mac :pr:`1656` @@ -35,6 +36,7 @@ Release Notes **Breaking Changes** * Removed ``has_searched`` property from ``AutoMLSearch`` :pr:`1647` + * Components and pipelines return ``Woodwork`` data structures instead of pandas data structures :pr:`1668` **v0.17.0 Dec. 29, 2020** * Enhancements diff --git a/evalml/pipelines/components/transformers/imputers/simple_imputer.py b/evalml/pipelines/components/transformers/imputers/simple_imputer.py index 82fb641ac4..f503d6ebe8 100644 --- a/evalml/pipelines/components/transformers/imputers/simple_imputer.py +++ b/evalml/pipelines/components/transformers/imputers/simple_imputer.py @@ -47,7 +47,6 @@ def fit(self, X, y=None): """ X = _convert_to_woodwork_structure(X) X = _convert_woodwork_types_wrapper(X.to_dataframe()) - # Convert all bool dtypes to category for fitting if (X.dtypes == bool).all(): X = X.astype('category') @@ -73,8 +72,7 @@ def transform(self, X, y=None): X = _convert_to_woodwork_structure(X) X = _convert_woodwork_types_wrapper(X.to_dataframe()) # Convert None to np.nan, since None cannot be properly handled - X = X.fillna(value=np.nan) - + X = X.fillna(value=np.nan) # with woodwork, do we need this? 
# Return early since bool dtype doesn't support nans and sklearn errors if all cols are bool if (X.dtypes == bool).all(): X = _convert_to_woodwork_structure(X) @@ -88,8 +86,9 @@ def transform(self, X, y=None): X_t = _convert_to_woodwork_structure(X_t) return X_t X_t = pd.DataFrame(X_t, columns=X_null_dropped.columns) - if len(category_cols) > 0: - X_t[category_cols] = X_t[category_cols].astype('category') + X_t = X_t.infer_objects() + # if len(category_cols) > 0: + # X_t[category_cols] = X_t[category_cols].astype('category') X_t = _convert_to_woodwork_structure(X_t) return X_t diff --git a/evalml/tests/component_tests/test_simple_imputer.py b/evalml/tests/component_tests/test_simple_imputer.py index 7cc3d398cd..8e8687d912 100644 --- a/evalml/tests/component_tests/test_simple_imputer.py +++ b/evalml/tests/component_tests/test_simple_imputer.py @@ -137,8 +137,8 @@ def test_simple_imputer_multitype_with_one_bool(data_type): }) y = pd.Series([1, 0, 0, 1, 0]) X_multi_expected_arr = pd.DataFrame({ - "bool with nan": pd.Series([True, False, False, False, False], dtype='category'), - "bool no nan": pd.Series([False, False, False, False, True], dtype=object), + "bool with nan": pd.Series([True, False, False, False, False], dtype='boolean'), + "bool no nan": pd.Series([False, False, False, False, True], dtype='boolean'), }) if data_type == 'ww': X_multi = ww.DataTable(X_multi) @@ -276,6 +276,6 @@ def test_simple_imputer_with_none(): imputer.fit(X, y) transformed = imputer.transform(X, y) expected = pd.DataFrame({"category with None": pd.Series(["b", "a", "a", "a"], dtype='category'), - "boolean with None": pd.Series([True, True, False, True], dtype='category'), + "boolean with None": pd.Series([True, True, False, True], dtype='boolean'), "object with None": pd.Series(["b", "a", "a", "a"], dtype='category')}) assert_frame_equal(expected, transformed.to_dataframe(), check_dtype=False) From d311015744565195c9284e64f6d899a2b1bebcee Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 8 Jan 2021 16:23:37 -0500 Subject: [PATCH 04/98] clean up imputer tests --- .../components/estimators/estimator.py | 2 -- .../transformers/imputers/imputer.py | 8 +++---- .../transformers/imputers/simple_imputer.py | 6 +++-- .../components/transformers/transformer.py | 5 ++-- evalml/tests/component_tests/test_imputer.py | 24 +++++++++---------- .../component_tests/test_simple_imputer.py | 2 +- 6 files changed, 22 insertions(+), 25 deletions(-) diff --git a/evalml/pipelines/components/estimators/estimator.py b/evalml/pipelines/components/estimators/estimator.py index 1cf9a21f11..ec6e2d3a93 100644 --- a/evalml/pipelines/components/estimators/estimator.py +++ b/evalml/pipelines/components/estimators/estimator.py @@ -1,7 +1,5 @@ from abc import abstractmethod -import pandas as pd - from evalml.exceptions import MethodPropertyNotFoundError from evalml.pipelines.components import ComponentBase from evalml.utils.gen_utils import ( diff --git a/evalml/pipelines/components/transformers/imputers/imputer.py b/evalml/pipelines/components/transformers/imputers/imputer.py index ed4d6fa776..3107909427 100644 --- a/evalml/pipelines/components/transformers/imputers/imputer.py +++ b/evalml/pipelines/components/transformers/imputers/imputer.py @@ -106,14 +106,14 @@ def transform(self, X, y=None): if self._numeric_cols is not None and len(self._numeric_cols) > 0: X_numeric = X_null_dropped[self._numeric_cols] - imputed = self._numeric_imputer.transform(X_numeric) - imputed.index = X_null_dropped.index + imputed = 
self._numeric_imputer.transform(X_numeric).to_dataframe() + # imputed.index = X_null_dropped.index X_null_dropped[X_numeric.columns] = imputed if self._categorical_cols is not None and len(self._categorical_cols) > 0: X_categorical = X_null_dropped[self._categorical_cols] - imputed = self._categorical_imputer.transform(X_categorical) - imputed.index = X_null_dropped.index + imputed = self._categorical_imputer.transform(X_categorical).to_dataframe() + # imputed.index = X_null_dropped.index X_null_dropped[X_categorical.columns] = imputed X_null_dropped = _convert_to_woodwork_structure(X_null_dropped) return X_null_dropped diff --git a/evalml/pipelines/components/transformers/imputers/simple_imputer.py b/evalml/pipelines/components/transformers/imputers/simple_imputer.py index f503d6ebe8..e297a43e63 100644 --- a/evalml/pipelines/components/transformers/imputers/simple_imputer.py +++ b/evalml/pipelines/components/transformers/imputers/simple_imputer.py @@ -72,14 +72,14 @@ def transform(self, X, y=None): X = _convert_to_woodwork_structure(X) X = _convert_woodwork_types_wrapper(X.to_dataframe()) # Convert None to np.nan, since None cannot be properly handled - X = X.fillna(value=np.nan) # with woodwork, do we need this? + X = X.fillna(value=np.nan) # with woodwork, do we need this? # Return early since bool dtype doesn't support nans and sklearn errors if all cols are bool if (X.dtypes == bool).all(): X = _convert_to_woodwork_structure(X) return X X_null_dropped = X.copy() X_null_dropped.drop(self._all_null_cols, axis=1, errors='ignore', inplace=True) - category_cols = X_null_dropped.select_dtypes(include=['category']).columns + # category_cols = X_null_dropped.select_dtypes(include=['category']).columns X_t = self._component_obj.transform(X) if X_null_dropped.empty: X_t = pd.DataFrame(X_t, columns=X_null_dropped.columns) @@ -87,6 +87,8 @@ def transform(self, X, y=None): return X_t X_t = pd.DataFrame(X_t, columns=X_null_dropped.columns) X_t = X_t.infer_objects() + X_t.index = X_null_dropped.index + # if len(category_cols) > 0: # X_t[category_cols] = X_t[category_cols].astype('category') X_t = _convert_to_woodwork_structure(X_t) diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index 4727e34882..0ecd28c19a 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -3,9 +3,9 @@ from evalml.exceptions import MethodPropertyNotFoundError from evalml.model_family import ModelFamily from evalml.pipelines.components import ComponentBase - from evalml.utils.gen_utils import _convert_to_woodwork_structure + class Transformer(ComponentBase): """A component that may or may not need fitting that transforms data. These components are used before an estimator. 
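[The contract these commits converge on, and which every test below is rewritten against, is: accept pandas, numpy, or Woodwork input, compute in pandas internally, and hand back a Woodwork structure that callers unwrap explicitly. A usage sketch of the resulting round trip, assuming the same import paths the test files above use:]

    import pandas as pd
    from pandas.testing import assert_frame_equal
    from evalml.pipelines.components import SimpleImputer

    X = pd.DataFrame({"a": [1.0, None, 3.0]})
    X_t = SimpleImputer(impute_strategy="mean").fit_transform(X)
    # X_t is now a ww.DataTable rather than a pd.DataFrame
    assert_frame_equal(X_t.to_dataframe(),
                       pd.DataFrame({"a": [1.0, 2.0, 3.0]}),
                       check_dtype=False)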
@@ -56,6 +56,5 @@ def fit_transform(self, X, y=None): except MethodPropertyNotFoundError as e: raise e - if not isinstance(X_t, pd.DataFrame) and isinstance(X, pd.DataFrame): - return _convert_to_woodwork_structure(pd.DataFrame(X_t, columns=X.columns, index=X.index)) + # return _convert_to_woodwork_structure(pd.DataFrame(X_t, columns=X.columns, index=X.index)) return _convert_to_woodwork_structure(X_t) diff --git a/evalml/tests/component_tests/test_imputer.py b/evalml/tests/component_tests/test_imputer.py index d660fb00c6..e2df993bdd 100644 --- a/evalml/tests/component_tests/test_imputer.py +++ b/evalml/tests/component_tests/test_imputer.py @@ -238,14 +238,14 @@ def test_imputer_fill_value(imputer_test_data): "categorical with nan": pd.Series(["fill", "1", "fill", "0", "3"], dtype='category'), "float with nan": [0.0, 1.0, -1, -1.0, 0.], "object with nan": pd.Series(["b", "b", "fill", "c", "fill"], dtype='category'), - "bool col with nan": [True, "fill", False, "fill", True] + "bool col with nan": pd.Series([True, "fill", False, "fill", True], dtype='category') }) - assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) + assert_frame_equal(expected, transformed.to_dataframe(), check_dtype=False) imputer = Imputer(categorical_impute_strategy="constant", numeric_impute_strategy="constant", categorical_fill_value="fill", numeric_fill_value=-1) transformed = imputer.fit_transform(X, y) - assert_frame_equal(transformed.to_dataframe(), expected, check_dtype=False) + assert_frame_equal(expected, transformed.to_dataframe(), check_dtype=False) def test_imputer_no_nans(imputer_test_data): @@ -292,13 +292,11 @@ def test_imputer_with_none(): @pytest.mark.parametrize("data_type", ['pd', 'ww']) -def test_imputer_all_bool_return_original(data_type): - X = pd.DataFrame([True, True, False, True, True], dtype=bool) - X_expected_arr = pd.DataFrame([True, True, False, True, True], dtype=bool) - y = pd.Series([1, 0, 0, 1, 0]) - if data_type == 'ww': - X = ww.DataTable(X) - y = ww.DataColumn(y) +def test_imputer_all_bool_return_original(data_type, make_data_type): + X = make_data_type(data_type, pd.DataFrame([True, True, False, True, True], dtype=bool)) + X_expected_arr = pd.DataFrame([True, True, False, True, True], dtype='boolean') + y = make_data_type(data_type, pd.Series([1, 0, 0, 1, 0])) + imputer = Imputer() imputer.fit(X, y) X_t = imputer.transform(X) @@ -309,7 +307,7 @@ def test_imputer_all_bool_return_original(data_type): def test_imputer_bool_dtype_object(data_type, make_data_type): X = pd.DataFrame([True, np.nan, False, np.nan, True], dtype=object) y = pd.Series([1, 0, 0, 1, 0]) - X_expected_arr = pd.DataFrame([True, True, False, True, True], dtype=object) + X_expected_arr = pd.DataFrame([True, True, False, True, True], dtype='boolean') X = make_data_type(data_type, X) y = make_data_type(data_type, y) imputer = Imputer() @@ -326,8 +324,8 @@ def test_imputer_multitype_with_one_bool(data_type): }) y = pd.Series([1, 0, 0, 1, 0]) X_multi_expected_arr = pd.DataFrame({ - "bool with nan": pd.Series([True, False, False, False, False], dtype=object), - "bool no nan": pd.Series([False, False, False, False, True], dtype=bool), + "bool with nan": pd.Series([True, False, False, False, False], dtype='boolean'), + "bool no nan": pd.Series([False, False, False, False, True], dtype='boolean'), }) if data_type == 'ww': X_multi = ww.DataTable(X_multi) diff --git a/evalml/tests/component_tests/test_simple_imputer.py b/evalml/tests/component_tests/test_simple_imputer.py index 8e8687d912..8ac32704f2 
100644 --- a/evalml/tests/component_tests/test_simple_imputer.py +++ b/evalml/tests/component_tests/test_simple_imputer.py @@ -109,7 +109,7 @@ def test_simple_imputer_all_bool_return_original(data_type, make_data_type): y = pd.Series([1, 0, 0, 1, 0]) X = make_data_type(data_type, X) y = make_data_type(data_type, y) - X_expected_arr = pd.DataFrame([True, True, False, True, True], dtype=bool) + X_expected_arr = pd.DataFrame([True, True, False, True, True], dtype='boolean') imputer = SimpleImputer() imputer.fit(X, y) X_t = imputer.transform(X) From 3c27d687b58487b2ecf30f20568df0d2d3b7ed03 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 8 Jan 2021 17:46:41 -0500 Subject: [PATCH 05/98] update datetime featurizer --- .../preprocessing/datetime_featurizer.py | 5 +- .../test_datetime_featurizer.py | 58 +++++++++++-------- 2 files changed, 37 insertions(+), 26 deletions(-) diff --git a/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py b/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py index 660abb9c84..2678deaa81 100644 --- a/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py +++ b/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py @@ -94,6 +94,7 @@ def transform(self, X, y=None): X_t = X features_to_extract = self.parameters["features_to_extract"] if len(features_to_extract) == 0: + X_t = _convert_to_woodwork_structure(X_t) return X_t for col_name in self._date_time_col_names: for feature in features_to_extract: @@ -102,7 +103,9 @@ def transform(self, X, y=None): X_t[name] = features if categories: self._categories[name] = categories - return X_t.drop(self._date_time_col_names, axis=1) + X_t = X_t.drop(self._date_time_col_names, axis=1) + X_t = _convert_to_woodwork_structure(X_t) + return X_t def get_feature_names(self): """Gets the categories of each datetime feature. 
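[Most of the churn in the datetime featurizer tests below is dtype-only: once a frame passes through Woodwork, integer columns come back as pandas' nullable `Int64` extension dtype instead of plain `int64`, so the expected frames are rebuilt with explicit dtypes. A minimal illustration, assuming the Woodwork versions this series targets:]

    import pandas as pd
    import woodwork as ww

    df = pd.DataFrame({"date_year": [2016, 2017, 2018]})
    assert str(df["date_year"].dtype) == "int64"
    dt = ww.DataTable(df)
    # Woodwork's Integer logical type is backed by the nullable extension dtype
    assert str(dt.to_dataframe()["date_year"].dtype) == "Int64"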
diff --git a/evalml/tests/component_tests/test_datetime_featurizer.py b/evalml/tests/component_tests/test_datetime_featurizer.py index 1c585d85cd..5294cdfc0e 100644 --- a/evalml/tests/component_tests/test_datetime_featurizer.py +++ b/evalml/tests/component_tests/test_datetime_featurizer.py @@ -22,32 +22,35 @@ def test_datetime_featurizer_encodes_as_ints(): X = pd.DataFrame({"date": ["2016-04-10 16:10:09", "2017-03-15 13:32:05", "2018-07-10 07:15:10", "2019-08-19 20:20:20", "2020-01-03 06:45:12"]}) dt = DateTimeFeaturizer() - X_transformed = dt.fit_transform(X) - answer = pd.DataFrame({"date_year": [2016, 2017, 2018, 2019, 2020], - "date_month": [3, 2, 6, 7, 0], - "date_day_of_week": [0, 3, 2, 1, 5], - "date_hour": [16, 13, 7, 20, 6]}) + X_transformed_df = dt.fit_transform(X) + expected = pd.DataFrame({"date_year": pd.Series([2016, 2017, 2018, 2019, 2020], dtype="Int64"), + "date_month": pd.Series([3, 2, 6, 7, 0], dtype="Int64"), + "date_day_of_week": pd.Series([0, 3, 2, 1, 5], dtype="Int64"), + "date_hour": pd.Series([16, 13, 7, 20, 6], dtype="Int64")}) feature_names = {'date_month': {'April': 3, 'March': 2, 'July': 6, 'August': 7, 'January': 0}, 'date_day_of_week': {'Sunday': 0, 'Wednesday': 3, 'Tuesday': 2, 'Monday': 1, 'Friday': 5} } - pd.testing.assert_frame_equal(X_transformed, answer) + pd.testing.assert_frame_equal(expected, X_transformed_df.to_dataframe()) assert dt.get_feature_names() == feature_names # Test that changing encode_as_categories to True only changes the dtypes but not the values dt_with_cats = DateTimeFeaturizer(encode_as_categories=True) - X_transformed = dt_with_cats.fit_transform(X) - answer = answer.astype({"date_day_of_week": "category", "date_month": "category"}) - pd.testing.assert_frame_equal(X_transformed, answer) + X_transformed_df = dt_with_cats.fit_transform(X) + expected["date_month"] = pd.Categorical([3, 2, 6, 7, 0]) + expected["date_day_of_week"] = pd.Categorical([0, 3, 2, 1, 5]) + + # import pdb; pdb.set_trace() + pd.testing.assert_frame_equal(expected, X_transformed_df.to_dataframe()) assert dt_with_cats.get_feature_names() == feature_names # Test that sequential calls to the same DateTimeFeaturizer work as expected by using the first dt we defined X = pd.DataFrame({"date": ["2020-04-10", "2017-03-15", "2019-08-19"]}) - X_transformed = dt.fit_transform(X) - answer = pd.DataFrame({"date_year": [2020, 2017, 2019], - "date_month": [3, 2, 7], - "date_day_of_week": [5, 3, 1], - "date_hour": [0, 0, 0]}) - pd.testing.assert_frame_equal(X_transformed, answer) + X_transformed_df = dt.fit_transform(X) + expected = pd.DataFrame({"date_year": pd.Series([2020, 2017, 2019], dtype="Int64"), + "date_month": pd.Series([3, 2, 7], dtype="Int64"), + "date_day_of_week": pd.Series([5, 3, 1], dtype="Int64"), + "date_hour": pd.Series([0, 0, 0], dtype="Int64")}) + pd.testing.assert_frame_equal(expected, X_transformed_df.to_dataframe()) assert dt.get_feature_names() == {'date_month': {'April': 3, 'March': 2, 'August': 7}, 'date_day_of_week': {'Friday': 5, 'Wednesday': 3, 'Monday': 1}} @@ -67,10 +70,10 @@ def test_datetime_featurizer_transform(): 'Date Col 2': pd.date_range('2020-02-03', periods=20, freq='W'), 'Numerical 2': [0] * 20}) datetime_transformer.fit(X) - transformed = datetime_transformer.transform(X_test) - assert list(transformed.columns) == ['Numerical 1', 'Numerical 2', 'Date Col 1_year', 'Date Col 2_year'] - assert transformed["Date Col 1_year"].equals(pd.Series([2020] * 20)) - assert transformed["Date Col 2_year"].equals(pd.Series([2020] * 20)) + 
transformed_df = datetime_transformer.transform(X_test).to_dataframe() + assert list(transformed_df.columns) == ['Numerical 1', 'Numerical 2', 'Date Col 1_year', 'Date Col 2_year'] + assert transformed_df["Date Col 1_year"].equals(pd.Series([2020] * 20, dtype="Int64")) + assert transformed_df["Date Col 2_year"].equals(pd.Series([2020] * 20, dtype="Int64")) assert datetime_transformer.get_feature_names() == {} @@ -80,10 +83,10 @@ def test_datetime_featurizer_fit_transform(): 'Date Col 1': pd.date_range('2020-05-19', periods=20, freq='D'), 'Date Col 2': pd.date_range('2020-02-03', periods=20, freq='W'), 'Numerical 2': [0] * 20}) - transformed = datetime_transformer.fit_transform(X) - assert list(transformed.columns) == ['Numerical 1', 'Numerical 2', 'Date Col 1_year', 'Date Col 2_year'] - assert transformed["Date Col 1_year"].equals(pd.Series([2020] * 20)) - assert transformed["Date Col 2_year"].equals(pd.Series([2020] * 20)) + transformed_df = datetime_transformer.fit_transform(X).to_dataframe() + assert list(transformed_df.columns) == ['Numerical 1', 'Numerical 2', 'Date Col 1_year', 'Date Col 2_year'] + assert transformed_df["Date Col 1_year"].equals(pd.Series([2020] * 20, dtype="Int64")) + assert transformed_df["Date Col 2_year"].equals(pd.Series([2020] * 20, dtype="Int64")) assert datetime_transformer.get_feature_names() == {} @@ -102,8 +105,11 @@ def test_datetime_featurizer_no_features_to_extract(): datetime_transformer = DateTimeFeaturizer(features_to_extract=[]) rng = pd.date_range('2020-02-24', periods=20, freq='D') X = pd.DataFrame({"date col": rng, "numerical": [0] * len(rng)}) + expected = X + expected["numerical"] = expected["numerical"].astype("Int64") datetime_transformer.fit(X) - assert datetime_transformer.transform(X).equals(X) + transformed = datetime_transformer.transform(X).to_dataframe() + pd.testing.assert_frame_equal(expected, transformed) assert datetime_transformer.get_feature_names() == {} @@ -119,8 +125,10 @@ def test_datetime_featurizer_custom_features_to_extract(): def test_datetime_featurizer_no_datetime_cols(): datetime_transformer = DateTimeFeaturizer(features_to_extract=["year", "month"]) X = pd.DataFrame([[1, 3, 4], [2, 5, 2]]) + expected = X.astype("Int64") datetime_transformer.fit(X) - assert datetime_transformer.transform(X).equals(X) + transformed = datetime_transformer.transform(X).to_dataframe() + pd.testing.assert_frame_equal(expected, transformed) assert datetime_transformer.get_feature_names() == {} From 482d2f1579e3eda46bfb1d7b8c3c1931176524b3 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Sat, 9 Jan 2021 01:36:20 -0500 Subject: [PATCH 06/98] update per_column_imputer --- .../imputers/per_column_imputer.py | 4 +-- .../test_per_column_imputer.py | 35 +++++++++---------- 2 files changed, 19 insertions(+), 20 deletions(-) diff --git a/evalml/pipelines/components/transformers/imputers/per_column_imputer.py b/evalml/pipelines/components/transformers/imputers/per_column_imputer.py index 8ddf18bc37..6e5bb18854 100644 --- a/evalml/pipelines/components/transformers/imputers/per_column_imputer.py +++ b/evalml/pipelines/components/transformers/imputers/per_column_imputer.py @@ -80,11 +80,11 @@ def transform(self, X, y=None): X_t = X.copy() cols_to_drop = [] for column, imputer in self.imputers.items(): - transformed = imputer.transform(X[[column]]) + transformed = imputer.transform(X[[column]]).to_dataframe() if transformed.empty: cols_to_drop.append(column) else: - X_t[column] = transformed + X_t[column] = transformed[column] X_t = X_t.drop(cols_to_drop, 
axis=1) return X_t diff --git a/evalml/tests/component_tests/test_per_column_imputer.py b/evalml/tests/component_tests/test_per_column_imputer.py index 71c8cf1ced..cf9d45076d 100644 --- a/evalml/tests/component_tests/test_per_column_imputer.py +++ b/evalml/tests/component_tests/test_per_column_imputer.py @@ -27,18 +27,15 @@ def test_invalid_parameters(): def test_all_strategies(): - X = pd.DataFrame([[2, 4, 6, "a"], - [4, 6, 8, "a"], - [6, 4, 8, "b"], - [np.nan, np.nan, np.nan, np.nan]]) + X = pd.DataFrame({"A": pd.Series([2, 4, 6, np.nan]), + "B": pd.Series([4, 6, 4, np.nan]), + "C": pd.Series([6, 8, 8, np.nan]), + "D": pd.Series(["a", "a", "b", np.nan])}) - X_expected = pd.DataFrame([[2, 4, 6, "a"], - [4, 6, 8, "a"], - [6, 4, 8, "b"], - [4, 4, 100, "a"]]) - - X.columns = ['A', 'B', 'C', 'D'] - X_expected.columns = ['A', 'B', 'C', 'D'] + X_expected = pd.DataFrame({"A": pd.Series([2, 4, 6, 4], dtype="int64"), + "B": pd.Series([4, 6, 4, 4], dtype="int64"), + "C": pd.Series([6, 8, 8, 100], dtype="int64"), + "D": pd.Series(["a", "a", "b", "a"], dtype="category")}) strategies = { 'A': {"impute_strategy": "mean"}, @@ -108,14 +105,13 @@ def test_non_numeric_valid(non_numeric_df): strategies = {'C': {"impute_strategy": "most_frequent"}} transformer = PerColumnImputer(impute_strategies=strategies) - X_expected = pd.DataFrame([["a", "a", "a", "a"], - ["b", "b", "b", "b"], - ["a", "a", "a", "a"], - ["a", "a", "a", "a"]]) - X_expected.columns = ['A', 'B', 'C', 'D'] + X_expected = pd.DataFrame({"A": pd.Series(["a", "b", "a", "a"], dtype="category"), + "B": pd.Series(["a", "b", "a", "a"], dtype="category"), + "C": pd.Series(["a", "b", "a", "a"], dtype="category"), + "D": pd.Series(["a", "b", "a", "a"], dtype="category")}) X_t = transformer.fit_transform(X) - assert_frame_equal(X_expected, X_t, check_dtype=False) + assert_frame_equal(X_expected, X_t) # constant with all strings strategies = {'D': {"impute_strategy": "constant", "fill_value": 100}} @@ -126,7 +122,10 @@ def test_non_numeric_valid(non_numeric_df): ["a", "a", "a", "a"], ["a", "a", "a", 100]]) X_expected.columns = ['A', 'B', 'C', 'D'] - + X_expected = pd.DataFrame({"A": pd.Series(["a", "b", "a", "a"], dtype="category"), + "B": pd.Series(["a", "b", "a", "a"], dtype="category"), + "C": pd.Series(["a", "b", "a", "a"], dtype="category"), + "D": pd.Series(["a", "b", "a", 100], dtype="category")}) X_t = transformer.fit_transform(X) assert_frame_equal(X_expected, X_t, check_dtype=False) From 2ad05261b1b5c4d1618222ef030fc0395b054580 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Sat, 9 Jan 2021 01:58:33 -0500 Subject: [PATCH 07/98] fix per col imputer tests --- .../imputers/per_column_imputer.py | 1 + .../test_per_column_imputer.py | 19 ++++++++++--------- 2 files changed, 11 insertions(+), 9 deletions(-) diff --git a/evalml/pipelines/components/transformers/imputers/per_column_imputer.py b/evalml/pipelines/components/transformers/imputers/per_column_imputer.py index 6e5bb18854..c6b0a477ed 100644 --- a/evalml/pipelines/components/transformers/imputers/per_column_imputer.py +++ b/evalml/pipelines/components/transformers/imputers/per_column_imputer.py @@ -86,6 +86,7 @@ def transform(self, X, y=None): else: X_t[column] = transformed[column] X_t = X_t.drop(cols_to_drop, axis=1) + X_t = _convert_to_woodwork_structure(X_t) return X_t def fit_transform(self, X, y=None): diff --git a/evalml/tests/component_tests/test_per_column_imputer.py b/evalml/tests/component_tests/test_per_column_imputer.py index cf9d45076d..d2d508ac85 100644 --- 
a/evalml/tests/component_tests/test_per_column_imputer.py +++ b/evalml/tests/component_tests/test_per_column_imputer.py @@ -46,7 +46,7 @@ def test_all_strategies(): transformer = PerColumnImputer(impute_strategies=strategies) X_t = transformer.fit_transform(X) - assert_frame_equal(X_expected, X_t, check_dtype=False) + assert_frame_equal(X_expected, X_t.to_dataframe(), check_dtype=False) def test_fit_transform(): @@ -62,7 +62,6 @@ def test_fit_transform(): X.columns = ['A'] X_expected.columns = ['A'] - strategies = {'A': {"impute_strategy": "median"}} transformer = PerColumnImputer(impute_strategies=strategies) @@ -72,7 +71,7 @@ def test_fit_transform(): transformer = PerColumnImputer(impute_strategies=strategies) X_fit_transform = transformer.fit_transform(X) - assert_frame_equal(X_t, X_fit_transform, check_dtype=False) + assert_frame_equal(X_t.to_dataframe(), X_fit_transform.to_dataframe()) def test_non_numeric_errors(non_numeric_df): @@ -111,7 +110,7 @@ def test_non_numeric_valid(non_numeric_df): "D": pd.Series(["a", "b", "a", "a"], dtype="category")}) X_t = transformer.fit_transform(X) - assert_frame_equal(X_expected, X_t) + assert_frame_equal(X_expected, X_t.to_dataframe()) # constant with all strings strategies = {'D': {"impute_strategy": "constant", "fill_value": 100}} @@ -127,7 +126,7 @@ def test_non_numeric_valid(non_numeric_df): "C": pd.Series(["a", "b", "a", "a"], dtype="category"), "D": pd.Series(["a", "b", "a", 100], dtype="category")}) X_t = transformer.fit_transform(X) - assert_frame_equal(X_expected, X_t, check_dtype=False) + assert_frame_equal(X_expected, X_t.to_dataframe(), check_dtype=False) def test_fit_transform_drop_all_nan_columns(): @@ -140,7 +139,7 @@ def test_fit_transform_drop_all_nan_columns(): transformer = PerColumnImputer(impute_strategies=strategies) X_expected_arr = pd.DataFrame({"some_nan": [0, 1, 0], "another_col": [0, 1, 2]}) X_t = transformer.fit_transform(X) - assert_frame_equal(X_expected_arr, X_t, check_dtype=False) + assert_frame_equal(X_expected_arr, X_t.to_dataframe(), check_dtype=False) assert_frame_equal(X, pd.DataFrame({"all_nan": [np.nan, np.nan, np.nan], "some_nan": [np.nan, 1, 0], "another_col": [0, 1, 2]})) @@ -156,7 +155,9 @@ def test_transform_drop_all_nan_columns(): transformer = PerColumnImputer(impute_strategies=strategies) transformer.fit(X) X_expected_arr = pd.DataFrame({"some_nan": [0, 1, 0], "another_col": [0, 1, 2]}) - assert_frame_equal(X_expected_arr, transformer.transform(X), check_dtype=False) + X_t = transformer.transform(X) + + assert_frame_equal(X_expected_arr, X_t.to_dataframe(), check_dtype=False) assert_frame_equal(X, pd.DataFrame({"all_nan": [np.nan, np.nan, np.nan], "some_nan": [np.nan, 1, 0], "another_col": [0, 1, 2]})) @@ -166,11 +167,11 @@ def test_transform_drop_all_nan_columns_empty(): X = pd.DataFrame([[np.nan, np.nan, np.nan]]) strategies = {'0': {"impute_strategy": "most_frequent"}, } transformer = PerColumnImputer(impute_strategies=strategies) - assert transformer.fit_transform(X).empty + assert transformer.fit_transform(X).to_dataframe().empty assert_frame_equal(X, pd.DataFrame([[np.nan, np.nan, np.nan]])) strategies = {'0': {"impute_strategy": "most_frequent"}} transformer = PerColumnImputer(impute_strategies=strategies) transformer.fit(X) - assert transformer.transform(X).empty + assert transformer.transform(X).to_dataframe().empty assert_frame_equal(X, pd.DataFrame([[np.nan, np.nan, np.nan]])) From 001dc59980722e63bb17e4b914226956a4045c2e Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Sat, 9 Jan 2021 
16:26:07 -0500 Subject: [PATCH 08/98] fix drop null cols tests --- .../transformers/imputers/imputer.py | 10 +++--- .../imputers/per_column_imputer.py | 4 +-- .../transformers/imputers/simple_imputer.py | 4 +-- .../preprocessing/drop_null_columns.py | 11 +++--- .../test_drop_null_columns_transformer.py | 35 +++++++++++++------ 5 files changed, 40 insertions(+), 24 deletions(-) diff --git a/evalml/pipelines/components/transformers/imputers/imputer.py b/evalml/pipelines/components/transformers/imputers/imputer.py index 3107909427..2727db101b 100644 --- a/evalml/pipelines/components/transformers/imputers/imputer.py +++ b/evalml/pipelines/components/transformers/imputers/imputer.py @@ -57,8 +57,8 @@ def fit(self, X, y=None): treated as the same. Arguments: - X (pd.DataFrame or np.ndarray): The input training data of shape [n_samples, n_features] - y (pd.Series, optional): The target training data of length [n_samples] + X (ww.DataTable, pd.DataFrame or np.ndarray): The input training data of shape [n_samples, n_features] + y (ww.DataColumn, pd.Series, optional): The target training data of length [n_samples] Returns: self @@ -89,11 +89,11 @@ def transform(self, X, y=None): treated as the same. Arguments: - X (pd.DataFrame): Data to transform - y (pd.Series, optional): Ignored. + X (ww.DataTable, pd.DataFrame): Data to transform + y (ww.DataColumn, pd.Series, optional): Ignored. Returns: - pd.DataFrame: Transformed X + ww.DataTable: Transformed X """ X = _convert_to_woodwork_structure(X) X = _convert_woodwork_types_wrapper(X.to_dataframe()) diff --git a/evalml/pipelines/components/transformers/imputers/per_column_imputer.py b/evalml/pipelines/components/transformers/imputers/per_column_imputer.py index c6b0a477ed..e5508ee433 100644 --- a/evalml/pipelines/components/transformers/imputers/per_column_imputer.py +++ b/evalml/pipelines/components/transformers/imputers/per_column_imputer.py @@ -73,7 +73,7 @@ def transform(self, X, y=None): y (ww.DataColumn, pd.Series, optional): The target training data of length [n_samples]. Ignored. Returns: - pd.DataFrame: Transformed X + ww.DataTable: Transformed X """ X = _convert_to_woodwork_structure(X) X = _convert_woodwork_types_wrapper(X.to_dataframe()) @@ -97,7 +97,7 @@ def fit_transform(self, X, y=None): y (ww.DataColumn, pd.Series, optional): The target training data of length [n_samples]. Ignored. Returns: - pd.DataFrame: Transformed X + ww.DataTable: Transformed X """ self.fit(X, y) diff --git a/evalml/pipelines/components/transformers/imputers/simple_imputer.py b/evalml/pipelines/components/transformers/imputers/simple_imputer.py index e297a43e63..f11c84b40a 100644 --- a/evalml/pipelines/components/transformers/imputers/simple_imputer.py +++ b/evalml/pipelines/components/transformers/imputers/simple_imputer.py @@ -67,7 +67,7 @@ def transform(self, X, y=None): y (ww.DataColumn, pd.Series, optional): Ignored. Returns: - pd.DataFrame: Transformed X + ww.DataTable: Transformed X """ X = _convert_to_woodwork_structure(X) X = _convert_woodwork_types_wrapper(X.to_dataframe()) @@ -102,6 +102,6 @@ def fit_transform(self, X, y=None): y (ww.DataColumn, pd.Series, optional): Target data. 
Returns: - pd.DataFrame: Transformed X + ww.DataTable: Transformed X """ return self.fit(X, y).transform(X, y) diff --git a/evalml/pipelines/components/transformers/preprocessing/drop_null_columns.py b/evalml/pipelines/components/transformers/preprocessing/drop_null_columns.py index 9ba7981b5c..3189ade525 100644 --- a/evalml/pipelines/components/transformers/preprocessing/drop_null_columns.py +++ b/evalml/pipelines/components/transformers/preprocessing/drop_null_columns.py @@ -44,12 +44,13 @@ def transform(self, X, y=None): """Transforms data X by dropping columns that exceed the threshold of null values. Arguments: - X (pd.DataFrame): Data to transform - y (pd.Series, optional): Ignored. + X (ww.DataTable, pd.DataFrame): Data to transform + y (ww.DataColumn, pd.Series, optional): Ignored. Returns: - pd.DataFrame: Transformed X + ww.DataTable: Transformed X """ X_t = _convert_to_woodwork_structure(X) - X_t = _convert_woodwork_types_wrapper(X_t.to_dataframe()) - return X_t.drop(columns=self._cols_to_drop, axis=1) + # X_t = _convert_woodwork_types_wrapper(X_t.to_dataframe()) + # return X_t.drop(columns=self._cols_to_drop, axis=1) + return X_t.drop(self._cols_to_drop) diff --git a/evalml/tests/component_tests/test_drop_null_columns_transformer.py b/evalml/tests/component_tests/test_drop_null_columns_transformer.py index 0e4f6786ab..2fe1cba719 100644 --- a/evalml/tests/component_tests/test_drop_null_columns_transformer.py +++ b/evalml/tests/component_tests/test_drop_null_columns_transformer.py @@ -1,6 +1,7 @@ import numpy as np import pandas as pd import pytest +from pandas.testing import assert_frame_equal from evalml.pipelines.components import DropNullColumns @@ -29,8 +30,10 @@ def test_drop_null_transformer_transform_default_pct_null_threshold(): drop_null_transformer = DropNullColumns() X = pd.DataFrame({'lots_of_null': [None, None, None, None, 5], 'no_null': [1, 2, 3, 4, 5]}) + X_expected = X.astype({'lots_of_null': 'float64', 'no_null': 'Int64'}) drop_null_transformer.fit(X) - assert drop_null_transformer.transform(X).equals(X) + X_t = drop_null_transformer.transform(X) + assert_frame_equal(X_expected, X_t.to_dataframe()) def test_drop_null_transformer_transform_custom_pct_null_threshold(): @@ -39,8 +42,11 @@ def test_drop_null_transformer_transform_custom_pct_null_threshold(): 'no_null': [1, 2, 3, 4, 5]}) drop_null_transformer = DropNullColumns(pct_null_threshold=0.5) + X_expected = X.drop(["lots_of_null", "all_null"], axis=1) + X_expected = X_expected.astype({"no_null": "Int64"}) drop_null_transformer.fit(X) - assert drop_null_transformer.transform(X).equals(X.drop(["lots_of_null", "all_null"], axis=1)) + X_t = drop_null_transformer.transform(X) + assert_frame_equal(X_expected, X_t.to_dataframe()) # check that X is untouched assert X.equals(pd.DataFrame({'lots_of_null': [None, None, None, None, 5], 'all_null': [None, None, None, None, None], @@ -53,11 +59,13 @@ def test_drop_null_transformer_transform_boundary_pct_null_threshold(): 'lots_of_null': [None, None, None, None, 5], 'some_null': [None, 0, 3, 4, 5]}) drop_null_transformer.fit(X) - assert drop_null_transformer.transform(X).empty + X_t = drop_null_transformer.transform(X) + assert X_t.to_dataframe().empty drop_null_transformer = DropNullColumns(pct_null_threshold=1.0) drop_null_transformer.fit(X) - assert drop_null_transformer.transform(X).equals(X.drop(["all_null"], axis=1)) + X_t = drop_null_transformer.transform(X) + assert_frame_equal(X_t.to_dataframe(), X.drop(["all_null"], axis=1)) # check that X is untouched assert 
X.equals(pd.DataFrame({'all_null': [None, None, None, None, None], 'lots_of_null': [None, None, None, None, 5], @@ -68,14 +76,18 @@ def test_drop_null_transformer_fit_transform(): drop_null_transformer = DropNullColumns() X = pd.DataFrame({'lots_of_null': [None, None, None, None, 5], 'no_null': [1, 2, 3, 4, 5]}) - assert drop_null_transformer.fit_transform(X).equals(X) + X_expected = X.astype({'lots_of_null': 'float64', 'no_null': 'Int64'}) + X_t = drop_null_transformer.fit_transform(X) + assert_frame_equal(X_expected, X_t.to_dataframe()) X = pd.DataFrame({'lots_of_null': [None, None, None, None, 5], 'all_null': [None, None, None, None, None], 'no_null': [1, 2, 3, 4, 5]}) - drop_null_transformer = DropNullColumns(pct_null_threshold=0.5) - assert drop_null_transformer.fit_transform(X).equals(X.drop(["lots_of_null", "all_null"], axis=1)) + X_expected = X.drop(["lots_of_null", "all_null"], axis=1) + X_expected = X_expected.astype({'no_null': 'Int64'}) + X_t = drop_null_transformer.fit_transform(X) + assert_frame_equal(X_expected, X_t.to_dataframe()) # check that X is untouched assert X.equals(pd.DataFrame({'lots_of_null': [None, None, None, None, 5], 'all_null': [None, None, None, None, None], @@ -84,13 +96,15 @@ def test_drop_null_transformer_fit_transform(): drop_null_transformer = DropNullColumns(pct_null_threshold=0.0) X = pd.DataFrame({'lots_of_null': [None, None, None, None, 5], 'some_null': [None, 0, 3, 4, 5]}) - assert drop_null_transformer.fit_transform(X).empty + X_t = drop_null_transformer.fit_transform(X) + assert X_t.to_dataframe().empty X = pd.DataFrame({'all_null': [None, None, None, None, None], 'lots_of_null': [None, None, None, None, 5], 'some_null': [None, 0, 3, 4, 5]}) drop_null_transformer = DropNullColumns(pct_null_threshold=1.0) - assert drop_null_transformer.fit_transform(X).equals(X.drop(["all_null"], axis=1)) + X_t = drop_null_transformer.fit_transform(X) + assert_frame_equal(X_t.to_dataframe(), X.drop(["all_null"], axis=1)) def test_drop_null_transformer_np_array(): @@ -99,7 +113,8 @@ def test_drop_null_transformer_np_array(): [np.nan, 1, np.nan, 0], [np.nan, 2, np.nan, 0], [np.nan, 1, 1, 0]]) - assert drop_null_transformer.fit_transform(X).equals(pd.DataFrame(np.delete(X, [0, 2], axis=1), columns=[1, 3])) + X_t = drop_null_transformer.fit_transform(X) + assert_frame_equal(X_t.to_dataframe(), pd.DataFrame(np.delete(X, [0, 2], axis=1), columns=[1, 3])) # check that X is untouched np.testing.assert_allclose(X, np.array([[np.nan, 0, 2, 0], From a24468d700ab2b7ea68b984adcd8b50f2b3e7c31 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Sat, 9 Jan 2021 16:58:17 -0500 Subject: [PATCH 09/98] fix ohe tests --- .../transformers/encoders/onehot_encoder.py | 1 + .../component_tests/test_one_hot_encoder.py | 27 ++++++++++--------- 2 files changed, 15 insertions(+), 13 deletions(-) diff --git a/evalml/pipelines/components/transformers/encoders/onehot_encoder.py b/evalml/pipelines/components/transformers/encoders/onehot_encoder.py index 1cf3049a2f..4c732cd775 100644 --- a/evalml/pipelines/components/transformers/encoders/onehot_encoder.py +++ b/evalml/pipelines/components/transformers/encoders/onehot_encoder.py @@ -151,6 +151,7 @@ def transform(self, X, y=None): X_cat.columns = self.get_feature_names() X_t = pd.concat([X_t, X_cat], axis=1) + X_t = _convert_to_woodwork_structure(X_t) return X_t def _handle_parameter_handle_missing(self, X): diff --git a/evalml/tests/component_tests/test_one_hot_encoder.py b/evalml/tests/component_tests/test_one_hot_encoder.py index 
97ce57f773..8fc1384c48 100644 --- a/evalml/tests/component_tests/test_one_hot_encoder.py +++ b/evalml/tests/component_tests/test_one_hot_encoder.py @@ -2,6 +2,7 @@ import pandas as pd import pytest import woodwork as ww +from pandas.testing import assert_frame_equal from evalml.exceptions import ComponentNotYetFittedError from evalml.pipelines.components import OneHotEncoder @@ -160,7 +161,7 @@ def test_handle_unknown(): encoder = OneHotEncoder(handle_unknown='error') encoder.fit(X) - assert isinstance(encoder.transform(X), pd.DataFrame) + assert isinstance(encoder.transform(X), ww.DataTable) X = pd.DataFrame({"col_1": ["x", "b", "c", "d", "e", "f", "g"], "col_2": ["a", "c", "d", "b", "e", "e", "f"], @@ -319,7 +320,7 @@ def test_categorical_dtype(): encoder = OneHotEncoder(top_n=5) encoder.fit(X) - X_t = encoder.transform(X) + X_t = encoder.transform(X).to_dataframe() expected_col_names = set(["col_1_f", "col_1_b", "col_1_c", "col_1_d", "col_1_e", "col_2_d", "col_2_e", "col_2_a", "col_3_a", @@ -335,11 +336,11 @@ def test_all_numerical_dtype(): "col_2": [3, 2, 5, 1, 3], "col_3": [0, 0, 1, 3, 2], "col_4": [2, 4, 1, 4, 0]}) - + X_expected = X.astype("Int64") encoder = OneHotEncoder(top_n=5) encoder.fit(X) X_t = encoder.transform(X) - assert X.equals(X_t) + assert_frame_equal(X_expected, X_t.to_dataframe()) def test_numpy_input(): @@ -347,7 +348,7 @@ def test_numpy_input(): encoder = OneHotEncoder() encoder.fit(X) X_t = encoder.transform(X) - pd.testing.assert_frame_equal(pd.DataFrame(X), X_t, check_dtype=False) + assert_frame_equal(pd.DataFrame(X), X_t.to_dataframe(), check_dtype=False) def test_large_number_of_categories(): @@ -380,7 +381,7 @@ def test_data_types(data_type): X = ww.DataTable(pd.DataFrame(["a", "b", "c"])) encoder = OneHotEncoder() encoder.fit(X) - X_t = encoder.transform(X) + X_t = encoder.transform(X).to_dataframe() assert list(X_t.columns) == ['0_a', '0_b', '0_c'] np.testing.assert_array_equal(X_t.to_numpy(), np.identity(3)) @@ -394,7 +395,7 @@ def test_ohe_preserves_custom_index(index): df = pd.DataFrame({"categories": [f"cat_{i}" for i in range(5)], "numbers": np.arange(5)}, index=index) ohe = OneHotEncoder() - new_df = ohe.fit_transform(df) + new_df = ohe.fit_transform(df).to_dataframe() pd.testing.assert_index_equal(new_df.index, df.index) assert not new_df.isna().any(axis=None) @@ -431,7 +432,7 @@ def test_ohe_features_to_encode(): encoder = OneHotEncoder(top_n=5, features_to_encode=['col_1']) encoder.fit(X) - X_t = encoder.transform(X) + X_t = encoder.transform(X).to_dataframe() expected_col_names = set(['col_1_0', 'col_1_1', 'col_1_2', 'col_2']) col_names = set(X_t.columns) assert (col_names == expected_col_names) @@ -439,7 +440,7 @@ def test_ohe_features_to_encode(): encoder = OneHotEncoder(top_n=5, features_to_encode=['col_1', 'col_2']) encoder.fit(X) - X_t = encoder.transform(X) + X_t = encoder.transform(X).to_dataframe() expected_col_names = set(['col_1_0', 'col_1_1', 'col_1_2', 'col_2_a', 'col_2_b', 'col_2_c', 'col_2_d']) col_names = set(X_t.columns) @@ -461,7 +462,7 @@ def test_ohe_features_to_encode_no_col_names(): X = pd.DataFrame([["b", 0], ["a", 1]]) encoder = OneHotEncoder(top_n=5, features_to_encode=[0]) encoder.fit(X) - X_t = encoder.transform(X) + X_t = encoder.transform(X).to_dataframe() expected_col_names = set([1, "0_a", "0_b"]) col_names = set(X_t.columns) assert (col_names == expected_col_names) @@ -474,9 +475,9 @@ def test_ohe_top_n_categories_always_the_same(): def check_df_equality(random_state): ohe = OneHotEncoder(top_n=4, 
random_state=random_state) - df1 = ohe.fit_transform(df) - df2 = ohe.fit_transform(df) - pd.testing.assert_frame_equal(df1, df2) + df1 = ohe.fit_transform(df).to_dataframe() + df2 = ohe.fit_transform(df).to_dataframe() + assert_frame_equal(df1, df2) check_df_equality(5) check_df_equality(get_random_state(5)) From f4eb8c09fcb97454363948c9e11a1c9af4b61981 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Sun, 10 Jan 2021 03:33:37 -0500 Subject: [PATCH 10/98] fix pca --- .../dimensionality_reduction/pca.py | 6 +++-- evalml/tests/component_tests/test_pca.py | 22 +++++++++---------- 2 files changed, 15 insertions(+), 13 deletions(-) diff --git a/evalml/pipelines/components/transformers/dimensionality_reduction/pca.py b/evalml/pipelines/components/transformers/dimensionality_reduction/pca.py index 9502eeca91..7f714919ec 100644 --- a/evalml/pipelines/components/transformers/dimensionality_reduction/pca.py +++ b/evalml/pipelines/components/transformers/dimensionality_reduction/pca.py @@ -50,7 +50,8 @@ def transform(self, X, y=None): raise ValueError("PCA input must be all numeric") X = _convert_woodwork_types_wrapper(X.to_dataframe()) X_t = self._component_obj.transform(X) - return pd.DataFrame(X_t, index=X.index, columns=[f"component_{i}" for i in range(X_t.shape[1])]) + X_t = pd.DataFrame(X_t, index=X.index, columns=[f"component_{i}" for i in range(X_t.shape[1])]) + return _convert_to_woodwork_structure(X_t) def fit_transform(self, X, y=None): X = _convert_to_woodwork_structure(X) @@ -58,4 +59,5 @@ def fit_transform(self, X, y=None): raise ValueError("PCA input must be all numeric") X = _convert_woodwork_types_wrapper(X.to_dataframe()) X_t = self._component_obj.fit_transform(X, y) - return pd.DataFrame(X_t, index=X.index, columns=[f"component_{i}" for i in range(X_t.shape[1])]) + X_t = pd.DataFrame(X_t, index=X.index, columns=[f"component_{i}" for i in range(X_t.shape[1])]) + return _convert_to_woodwork_structure(X_t) diff --git a/evalml/tests/component_tests/test_pca.py b/evalml/tests/component_tests/test_pca.py index fa88725b89..9bb28d208b 100644 --- a/evalml/tests/component_tests/test_pca.py +++ b/evalml/tests/component_tests/test_pca.py @@ -21,8 +21,8 @@ def test_pca_numeric(data_type, make_data_type): [-4.079174, -0.252790], [-0.112877, -0.755922]], columns=[f"component_{i}" for i in range(2)]) - X_t = pd.DataFrame(pca.fit_transform(X)) - assert_frame_equal(X_t, expected_X_t) + X_t = pca.fit_transform(X) + assert_frame_equal(expected_X_t, X_t.to_dataframe()) def test_pca_array(): @@ -39,8 +39,8 @@ def test_pca_array(): [-0.112877, -0.755922]], columns=[f"component_{i}" for i in range(2)]) pca.fit(X) - X_t = pd.DataFrame(pca.transform(X)) - assert_frame_equal(X_t, expected_X_t) + X_t = pca.transform(X) + assert_frame_equal(expected_X_t, X_t.to_dataframe()) def test_pca_invalid(): @@ -86,15 +86,15 @@ def test_variance(): [7.067179, 0.645894, -2.633617, 2.159135], [6.828241, -3.867796, 2.597358, -1.740404]], columns=[f"component_{i}" for i in range(4)]) - X_t_90 = pd.DataFrame(pca.fit_transform(X)) - assert_frame_equal(X_t_90, expected_X_t) + X_t_90 = pca.fit_transform(X) + assert_frame_equal(expected_X_t, X_t_90.to_dataframe()) pca = PCA(variance=0.75) - X_t_75 = pd.DataFrame(pca.fit_transform(X)) + X_t_75 = pca.fit_transform(X) assert X_t_75.shape[1] < X_t_90.shape[1] pca = PCA(variance=0.50) - X_t_50 = pd.DataFrame(pca.fit_transform(X)) + X_t_50 = pca.fit_transform(X) assert X_t_50.shape[1] < X_t_75.shape[1] @@ -105,13 +105,13 @@ def test_n_components(): [10, 6, 4, 4, 0, 1], [6, 8, 9, 3, 1, 
5]]) pca = PCA(n_components=5) - X_t = pd.DataFrame(pca.fit_transform(X)) + X_t = pca.fit_transform(X) assert X_t.shape[1] == 5 pca = PCA(n_components=3) - X_t = pd.DataFrame(pca.fit_transform(X)) + X_t = pca.fit_transform(X) assert X_t.shape[1] == 3 pca = PCA(n_components=1) - X_t = pd.DataFrame(pca.fit_transform(X)) + X_t = pca.fit_transform(X) assert X_t.shape[1] == 1 From 49c8400ed17f5e6da54b244d1ab0c9bebf8215ab Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Sun, 10 Jan 2021 03:47:53 -0500 Subject: [PATCH 11/98] fix lda --- .../transformers/dimensionality_reduction/lda.py | 6 ++++-- evalml/tests/component_tests/test_lda.py | 12 ++++++------ 2 files changed, 10 insertions(+), 8 deletions(-) diff --git a/evalml/pipelines/components/transformers/dimensionality_reduction/lda.py b/evalml/pipelines/components/transformers/dimensionality_reduction/lda.py index fc0ca2fde6..e53c429511 100644 --- a/evalml/pipelines/components/transformers/dimensionality_reduction/lda.py +++ b/evalml/pipelines/components/transformers/dimensionality_reduction/lda.py @@ -52,7 +52,8 @@ def transform(self, X, y=None): raise ValueError("LDA input must be all numeric") X = _convert_woodwork_types_wrapper(X.to_dataframe()) X_t = self._component_obj.transform(X) - return pd.DataFrame(X_t, index=X.index, columns=[f"component_{i}" for i in range(X_t.shape[1])]) + X_t = pd.DataFrame(X_t, index=X.index, columns=[f"component_{i}" for i in range(X_t.shape[1])]) + return _convert_to_woodwork_structure(X_t) def fit_transform(self, X, y=None): X = _convert_to_woodwork_structure(X) @@ -63,4 +64,5 @@ def fit_transform(self, X, y=None): y = _convert_woodwork_types_wrapper(y.to_series()) X_t = self._component_obj.fit_transform(X, y) - return pd.DataFrame(X_t, index=X.index, columns=[f"component_{i}" for i in range(X_t.shape[1])]) + X_t = pd.DataFrame(X_t, index=X.index, columns=[f"component_{i}" for i in range(X_t.shape[1])]) + return _convert_to_woodwork_structure(X_t) diff --git a/evalml/tests/component_tests/test_lda.py b/evalml/tests/component_tests/test_lda.py index bd3ff187b9..675f775297 100644 --- a/evalml/tests/component_tests/test_lda.py +++ b/evalml/tests/component_tests/test_lda.py @@ -28,8 +28,8 @@ def test_lda_numeric(data_type, make_data_type): [1.3401547523131798], [3.659653362085993]], columns=["component_0"]) - X_t = pd.DataFrame(lda.fit_transform(X, y)) - assert_frame_equal(X_t, expected_X_t) + X_t = lda.fit_transform(X, y) + assert_frame_equal(expected_X_t, X_t.to_dataframe()) def test_lda_array(): @@ -47,8 +47,8 @@ def test_lda_array(): [-0.4751798337481819, -0.7065437888758568]], columns=[f"component_{i}" for i in range(2)]) lda.fit(X, y) - X_t = pd.DataFrame(lda.transform(X)) - assert_frame_equal(X_t, expected_X_t) + X_t = lda.transform(X) + assert_frame_equal(expected_X_t, X_t.to_dataframe()) def test_lda_invalid(): @@ -93,11 +93,11 @@ def test_n_components(): y = [0, 3, 3, 1, 2, 0, 2] lda = LinearDiscriminantAnalysis(n_components=3) - X_t = pd.DataFrame(lda.fit_transform(X, y)) + X_t = lda.fit_transform(X, y) assert X_t.shape[1] == 3 lda = LinearDiscriminantAnalysis(n_components=1) - X_t = pd.DataFrame(lda.fit_transform(X, y)) + X_t = lda.fit_transform(X, y) assert X_t.shape[1] == 1 From ab8789fa5cabb6d34ddaaed5a412c584118a8bdc Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Sun, 10 Jan 2021 17:32:48 -0500 Subject: [PATCH 12/98] fix lsa and text featurizer --- .../transformers/preprocessing/lsa.py | 3 +- .../preprocessing/text_featurizer.py | 16 ++++---- evalml/tests/component_tests/test_lsa.py | 19 +++++---- 
.../component_tests/test_text_featurizer.py | 40 ++++++++++--------- 4 files changed, 44 insertions(+), 34 deletions(-) diff --git a/evalml/pipelines/components/transformers/preprocessing/lsa.py b/evalml/pipelines/components/transformers/preprocessing/lsa.py index 6bc2a7e9f4..ce1eb658c4 100644 --- a/evalml/pipelines/components/transformers/preprocessing/lsa.py +++ b/evalml/pipelines/components/transformers/preprocessing/lsa.py @@ -49,7 +49,7 @@ def transform(self, X, y=None): y (ww.DataColumn, pd.Series, optional): Ignored. Returns: - pd.DataFrame: Transformed X. The original column is removed and replaced with two columns of the + ww.DataTable: Transformed X. The original column is removed and replaced with two columns of the format `LSA(original_column_name)[feature_number]`, where `feature_number` is 0 or 1. """ X = _convert_to_woodwork_structure(X) @@ -64,4 +64,5 @@ def transform(self, X, y=None): X_t['LSA({})[0]'.format(col)] = pd.Series(transformed[:, 0], index=X.index) X_t['LSA({})[1]'.format(col)] = pd.Series(transformed[:, 1], index=X.index) X_t = X_t.drop(columns=text_columns) + X_t = _convert_to_woodwork_structure(X_t) return X_t diff --git a/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py b/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py index 1b4c02d01e..a3fd15e5e3 100644 --- a/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py +++ b/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py @@ -66,8 +66,8 @@ def fit(self, X, y=None): """Fits component to data Arguments: - X (pd.DataFrame or np.ndarray): the input training data of shape [n_samples, n_features] - y (pd.Series, optional): the target training labels of length [n_samples] + X (ww.DataTable, pd.DataFrame or np.ndarray): the input training data of shape [n_samples, n_features] + y (ww.DataColumn, pd.Series, optional): the target training labels of length [n_samples] Returns: self @@ -90,11 +90,11 @@ def transform(self, X, y=None): """Transforms data X by creating new features using existing text columns Arguments: - X (pd.DataFrame): Data to transform - y (pd.Series, optional): Ignored. + X (ww.DataTable, pd.DataFrame): Data to transform + y (ww.DataColumn, pd.Series, optional): Ignored. 
Returns:
-            pd.DataFrame: Transformed X
+            ww.DataTable: Transformed X
         """
         X = _convert_to_woodwork_structure(X)
         X = _convert_woodwork_types_wrapper(X.to_dataframe())
@@ -106,6 +106,8 @@ def transform(self, X, y=None):
         X_nlp_primitives = ft.calculate_feature_matrix(features=self._features, entityset=es)
         if X_nlp_primitives.isnull().any().any():
             X_nlp_primitives.fillna(0, inplace=True)
-        X_lsa = self._lsa.transform(X[text_columns])
+        X_lsa = self._lsa.transform(X[text_columns]).to_dataframe()
         X_nlp_primitives.set_index(X.index, inplace=True)
-        return pd.concat([X.drop(text_columns, axis=1), X_nlp_primitives, X_lsa], axis=1)
+        X_t = pd.concat([X.drop(text_columns, axis=1), X_nlp_primitives, X_lsa], axis=1)
+        X_t = _convert_to_woodwork_structure(X_t)
+        return X_t
diff --git a/evalml/tests/component_tests/test_lsa.py b/evalml/tests/component_tests/test_lsa.py
index 027cb4c660..d3ac641f56 100644
--- a/evalml/tests/component_tests/test_lsa.py
+++ b/evalml/tests/component_tests/test_lsa.py
@@ -3,6 +3,8 @@
 import numpy as np
 import pandas as pd
 import pytest
+import woodwork as ww
+from pandas.testing import assert_frame_equal

 from evalml.pipelines.components import LSA

@@ -19,7 +21,7 @@ def test_lsa_only_text(text_df):
     X_t = lsa.transform(X)
     assert set(X_t.columns) == expected_col_names
     assert len(X_t.columns) == 4
-    assert X_t.dtypes.all() == np.float64
+    assert set(X_t.logical_types.values()) == {ww.logical_types.Double}


 def test_lsa_with_nontext(text_df):
@@ -36,7 +38,7 @@
     X_t = lsa.transform(X)
     assert set(X_t.columns) == expected_col_names
     assert len(X_t.columns) == 5
-    assert X_t.dtypes.all() == np.float64
+    assert set(X_t.logical_types.values()) == {ww.logical_types.Double}


 def test_lsa_no_text():
@@ -62,7 +64,7 @@ def test_some_missing_col_names(text_df, caplog):
     X_t = lsa.transform(X)
     assert set(X_t.columns) == expected_col_names
     assert len(X_t.columns) == 4
-    assert X_t.dtypes.all() == np.float64
+    assert set(X_t.logical_types.values()) == {ww.logical_types.Double}


 def test_all_missing_col_names(text_df):
@@ -115,7 +117,7 @@ def test_index_col_names():
     X_t = lsa.transform(X)
     assert set(X_t.columns) == expected_col_names
     assert len(X_t.columns) == 4
-    assert X_t.dtypes.all() == np.float64
+    assert set(X_t.logical_types.values()) == {ww.logical_types.Double}


 def test_int_col_names():
@@ -136,7 +138,7 @@
     X_t = lsa.transform(X)
     assert set(X_t.columns) == expected_col_names
     assert len(X_t.columns) == 4
-    assert X_t.dtypes.all() == np.float64
+    assert set(X_t.logical_types.values()) == {ww.logical_types.Double}


 def test_lsa_output():
@@ -150,10 +152,10 @@
-    expected_features = [[0.832, 0.],
-                         [0., 1.],
-                         [0.832, 0.]]
+    expected_features = pd.DataFrame([[0.832, 0.],
+                                      [0., 1.],
+                                      [0.832, 0.]], columns=["LSA(lsa)[0]", "LSA(lsa)[1]"])
     X_t = lsa.transform(X)
     cols = [col for col in X_t.columns if 'LSA' in col]
     features = X_t[cols]
-    np.testing.assert_almost_equal(features, expected_features, decimal=3)
+    assert_frame_equal(expected_features, features.to_dataframe(), atol=1e-3)


 def test_lsa_with_custom_indices(text_df):
@@ -162,4 +167,4 @@
     lsa = LSA(text_columns=['col_1', 'col_2'])
     lsa.fit(X)
     X_t = lsa.transform(X)
-    assert not X_t.isnull().any().any()
+    assert not X_t.to_dataframe().isnull().any().any()
diff --git a/evalml/tests/component_tests/test_text_featurizer.py b/evalml/tests/component_tests/test_text_featurizer.py
index f713df2500..dbb60257a9 100644
---
a/evalml/tests/component_tests/test_text_featurizer.py +++ b/evalml/tests/component_tests/test_text_featurizer.py @@ -3,6 +3,8 @@ import numpy as np import pandas as pd import pytest +import woodwork as ww +from pandas.testing import assert_frame_equal, assert_series_equal from evalml.pipelines.components import TextFeaturizer @@ -25,7 +27,7 @@ def test_featurizer_only_text(text_df): X_t = tf.transform(X) assert set(X_t.columns) == expected_col_names assert len(X_t.columns) == 10 - assert X_t.dtypes.all() == np.float64 + assert set(X_t.logical_types.values()) == {ww.logical_types.Double} def test_featurizer_with_nontext(text_df): @@ -48,7 +50,7 @@ def test_featurizer_with_nontext(text_df): X_t = tf.transform(X) assert set(X_t.columns) == expected_col_names assert len(X_t.columns) == 11 - assert X_t.dtypes.all() == np.float64 + assert set(X_t.logical_types.values()) == {ww.logical_types.Double} def test_featurizer_no_text(): @@ -80,7 +82,7 @@ def test_some_missing_col_names(text_df, caplog): X_t = tf.transform(X) assert set(X_t.columns) == expected_col_names assert len(X_t.columns) == 10 - assert X_t.dtypes.all() == np.float64 + assert set(X_t.logical_types.values()) == {ww.logical_types.Double} def test_all_missing_col_names(text_df): @@ -124,7 +126,7 @@ def test_no_null_output(): tf = TextFeaturizer(text_columns=['col_1', 'col_2']) tf.fit(X) X_t = tf.transform(X) - assert not X_t.isnull().any().any() + assert not X_t.to_dataframe().isnull().any().any() def test_index_col_names(): @@ -147,7 +149,7 @@ def test_index_col_names(): X_t = tf.transform(X) assert set(X_t.columns) == expected_col_names assert len(X_t.columns) == 10 - assert X_t.dtypes.all() == np.float64 + assert set(X_t.logical_types.values()) == {ww.logical_types.Double} def test_int_col_names(): @@ -174,7 +176,7 @@ def test_int_col_names(): X_t = tf.transform(X) assert set(X_t.columns) == expected_col_names assert len(X_t.columns) == 10 - assert X_t.dtypes.all() == np.float64 + assert set(X_t.logical_types.values()) == {ww.logical_types.Double} def test_output_null(): @@ -189,7 +191,7 @@ def test_output_null(): tf = TextFeaturizer(text_columns=['col_1', 'col_2']) tf.fit(X) X_t = tf.transform(X) - assert not X_t.isnull().any().any() + assert not X_t.to_dataframe().isnull().any().any() def test_diversity_primitive_output(): @@ -200,10 +202,10 @@ def test_diversity_primitive_output(): tf = TextFeaturizer(text_columns=['diverse']) tf.fit(X) - expected_features = [1.0, 0.5, 0.75] + expected_features = pd.Series([1.0, 0.5, 0.75], name='DIVERSITY_SCORE(diverse)') X_t = tf.transform(X) - features = X_t['DIVERSITY_SCORE(diverse)'] - np.testing.assert_almost_equal(features, expected_features) + features = X_t['DIVERSITY_SCORE(diverse)'].to_series() + assert_series_equal(expected_features, features) def test_lsa_primitive_output(): @@ -214,13 +216,13 @@ def test_lsa_primitive_output(): tf = TextFeaturizer(text_columns=['lsa']) tf.fit(X) - expected_features = [[0.832, 0.], - [0., 1.], - [0.832, 0.]] + expected_features = pd.DataFrame([[0.832, 0.], + [0., 1.], + [0.832, 0.]], columns=['LSA(lsa)[0]', 'LSA(lsa)[1]']) X_t = tf.transform(X) cols = [col for col in X_t.columns if 'LSA' in col] features = X_t[cols] - np.testing.assert_almost_equal(features, expected_features, decimal=3) + assert_frame_equal(expected_features, features.to_dataframe(), atol=1e-3) def test_mean_characters_primitive_output(): @@ -231,10 +233,10 @@ def test_mean_characters_primitive_output(): tf = TextFeaturizer(text_columns=['mean_characters']) tf.fit(X) - 
expected_features = [4.11764705882352, 3.45, 3.72727272727] + expected_features = pd.Series([4.11764705882352, 3.45, 3.72727272727], name='MEAN_CHARACTERS_PER_WORD(mean_characters)') X_t = tf.transform(X) features = X_t['MEAN_CHARACTERS_PER_WORD(mean_characters)'] - np.testing.assert_almost_equal(features, expected_features) + assert_series_equal(expected_features, features.to_series()) def test_polarity_primitive_output(): @@ -245,10 +247,10 @@ def test_polarity_primitive_output(): tf = TextFeaturizer(text_columns=['polarity']) tf.fit(X) - expected_features = [0.0, -0.214, 0.602] + expected_features = pd.Series([0.0, -0.214, 0.602], name='POLARITY_SCORE(polarity)') X_t = tf.transform(X) features = X_t['POLARITY_SCORE(polarity)'] - np.testing.assert_almost_equal(features, expected_features) + assert_series_equal(expected_features, features.to_series()) def test_featurizer_with_custom_indices(text_df): @@ -257,4 +259,4 @@ def test_featurizer_with_custom_indices(text_df): tf = TextFeaturizer(text_columns=['col_1', 'col_2']) tf.fit(X) X_t = tf.transform(X) - assert not X_t.isnull().any().any() + assert not X_t.to_dataframe().isnull().any().any() From 0865d322860f382d2685b0825fd6144a261f5660 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Mon, 11 Jan 2021 11:28:08 -0500 Subject: [PATCH 13/98] update featuretools --- .../classifiers/baseline_classifier.py | 14 ++++++----- .../transformers/column_selectors.py | 23 ++++++++++--------- .../preprocessing/datetime_featurizer.py | 10 ++++---- .../preprocessing/featuretools.py | 8 ++++++- .../components/transformers/transformer.py | 21 +++++++++-------- .../test_baseline_classifier.py | 8 +++---- .../test_datetime_featurizer.py | 12 +++++----- .../component_tests/test_featuretools.py | 16 +++++++------ 8 files changed, 62 insertions(+), 50 deletions(-) diff --git a/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py b/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py index 81dbfb897e..5ea99f1953 100644 --- a/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py +++ b/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py @@ -64,11 +64,12 @@ def predict(self, X): X = _convert_woodwork_types_wrapper(X.to_dataframe()) strategy = self.parameters["strategy"] if strategy == "mode": - return pd.Series([self._mode] * len(X)) + predictions = pd.Series([self._mode] * len(X)) elif strategy == "random": - return self.random_state.choice(self._classes, len(X)) + predictions = self.random_state.choice(self._classes, len(X)) else: - return self.random_state.choice(self._classes, len(X), p=self._percentage_freq) + predictions = self.random_state.choice(self._classes, len(X), p=self._percentage_freq) + return _convert_to_woodwork_structure(predictions) def predict_proba(self, X): X = _convert_to_woodwork_structure(X) @@ -77,13 +78,14 @@ def predict_proba(self, X): if strategy == "mode": mode_index = self._classes.index(self._mode) proba_arr = np.array([[1.0 if i == mode_index else 0.0 for i in range(self._num_unique)]] * len(X)) - return pd.DataFrame(proba_arr, columns=self._classes) + predictions = pd.DataFrame(proba_arr, columns=self._classes) elif strategy == "random": proba_arr = np.array([[1.0 / self._num_unique for i in range(self._num_unique)]] * len(X)) - return pd.DataFrame(proba_arr, columns=self._classes) + predictions = pd.DataFrame(proba_arr, columns=self._classes) else: proba_arr = np.array([[self._percentage_freq[i] for i in range(self._num_unique)]] * len(X)) - return 
pd.DataFrame(proba_arr, columns=self._classes) + predictions = pd.DataFrame(proba_arr, columns=self._classes) + return _convert_to_woodwork_structure(predictions) @property def feature_importance(self): diff --git a/evalml/pipelines/components/transformers/column_selectors.py b/evalml/pipelines/components/transformers/column_selectors.py index 1e176c8f1d..a78e0200be 100644 --- a/evalml/pipelines/components/transformers/column_selectors.py +++ b/evalml/pipelines/components/transformers/column_selectors.py @@ -48,11 +48,11 @@ def fit(self, X, y=None): """'Fits' the transformer by checking if the column names are present in the dataset. Arguments: - X (pd.DataFrame): Data to check. - y (pd.Series, optional): Targets. + X (ww.DataTable, pd.DataFrame): Data to check. + y (ww.DataColumn, pd.Series, optional): Targets. Returns: - None. + self """ self._check_input_for_columns(X) @@ -64,7 +64,8 @@ def transform(self, X, y=None): self._check_input_for_columns(X) cols = self.parameters.get("columns") or [] - return self._modify_columns(cols, X, y) + cols = self._modify_columns(cols, X, y) + return _convert_to_woodwork_structure(cols) def fit_transform(self, X, y=None): """Fit transformer to data, then transform data. @@ -74,7 +75,7 @@ def fit_transform(self, X, y=None): y (pd.Series, optional): Targets. Returns: - pd.DataFrame: Transformed X. + ww.DataTable: Transformed X. """ # transform method already calls fit under the hood. @@ -95,11 +96,11 @@ def transform(self, X, y=None): """Transforms data X by dropping columns. Arguments: - X (pd.DataFrame): Data to transform. - y (pd.Series, optional): Targets. + X (ww.DataTable, pd.DataFrame): Data to transform. + y (ww.DataColumn, pd.Series, optional): Targets. Returns: - pd.DataFrame: Transformed X. + ww.DataTable: Transformed X. """ return super().transform(X, y) @@ -117,10 +118,10 @@ def transform(self, X, y=None): """Transforms data X by selecting columns. Arguments: - X (pd.DataFrame): Data to transform. - y (pd.Series, optional): Targets. + X (ww.DataTable, pd.DataFrame): Data to transform. + y (ww.DataColumn, pd.Series, optional): Targets. Returns: - pd.DataFrame: Transformed X. + ww.DataTable: Transformed X. """ return super().transform(X, y) diff --git a/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py b/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py index 2678deaa81..17b296d7e8 100644 --- a/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py +++ b/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py @@ -83,11 +83,11 @@ def transform(self, X, y=None): """Transforms data X by creating new features using existing DateTime columns, and then dropping those DateTime columns Arguments: - X (pd.DataFrame): Data to transform - y (pd.Series, optional): Ignored. + X (ww.DataTable, pd.DataFrame): Data to transform + y (ww.DataColumn, pd.Series, optional): Ignored. Returns: - pd.DataFrame: Transformed X + ww.DataTable: Transformed X """ X = _convert_to_woodwork_structure(X) X = _convert_woodwork_types_wrapper(X.to_dataframe()) @@ -111,7 +111,7 @@ def get_feature_names(self): """Gets the categories of each datetime feature. Returns: - Dict. Each key-value pair is a column name and a dictionary mapping the unique feature values to their - integer encoding. + Dictionary, where each key-value pair is a column name and a dictionary + mapping the unique feature values to their integer encoding. 
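+
+            For example (hypothetical data), a featurizer fit on a single "date"
+            column covering March and April might return:
+            {'date_month': {'March': 2, 'April': 3},
+             'date_day_of_week': {'Monday': 1, 'Friday': 5}}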
""" return self._categories diff --git a/evalml/pipelines/components/transformers/preprocessing/featuretools.py b/evalml/pipelines/components/transformers/preprocessing/featuretools.py index 90f3af9edb..ecc1d45263 100644 --- a/evalml/pipelines/components/transformers/preprocessing/featuretools.py +++ b/evalml/pipelines/components/transformers/preprocessing/featuretools.py @@ -46,6 +46,9 @@ def fit(self, X, y=None): Arguments: X (ww.DataTable, pd.DataFrame, np.array): The input data to transform, of shape [n_samples, n_features] y (ww.DataColumn, pd.Series, np.ndarray, optional): The target training data of length [n_samples] + + Returns: + self """ X = _convert_to_woodwork_structure(X) X = _convert_woodwork_types_wrapper(X.to_dataframe()) @@ -61,10 +64,13 @@ def transform(self, X, y=None): Arguments: X (ww.DataTable, pd.DataFrame or np.ndarray): The input training data to transform. Has shape [n_samples, n_features] + y (ww.DataColumn, pd.Series, optional): Ignored. + Returns: + ww.DataTable: Feature matrix """ X = _convert_to_woodwork_structure(X) X = _convert_woodwork_types_wrapper(X.to_dataframe()) X.columns = X.columns.astype(str) es = self._make_entity_set(X) feature_matrix = calculate_feature_matrix(features=self.features, entityset=es) - return feature_matrix + return _convert_to_woodwork_structure(feature_matrix) diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index 0ecd28c19a..71eee3d332 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -25,27 +25,30 @@ def transform(self, X, y=None): """Transforms data X Arguments: - X (pd.DataFrame): Data to transform - y (pd.Series, optional): Target data + X (ww.DataTable, pd.DataFrame): Data to transform + y (ww.DataColumn, pd.Series, optional): Target data + Returns: - pd.DataFrame: Transformed X + ww.DataTable: Transformed X """ try: X_t = self._component_obj.transform(X) except AttributeError: raise MethodPropertyNotFoundError("Transformer requires a transform method or a component_obj that implements transform") - if not isinstance(X_t, pd.DataFrame) and isinstance(X, pd.DataFrame): - return _convert_to_woodwork_structure(pd.DataFrame(X_t, columns=X.columns, index=X.index)) + # if isinstance(X, pd.DataFrame): + # return _convert_to_woodwork_structure(pd.DataFrame(X_t, columns=X.columns, index=X.index)) + return _convert_to_woodwork_structure(X_t) def fit_transform(self, X, y=None): """Fits on X and transforms X Arguments: - X (pd.DataFrame): Data to fit and transform - y (pd. 
DataFrame): Target data + X (ww.DataTable, pd.DataFrame): Data to fit and transform + y (ww.DataColumn, pd.Series): Target data + Returns: - pd.DataFrame: Transformed X + ww.DataTable: Transformed X """ try: X_t = self._component_obj.fit_transform(X, y) @@ -55,6 +58,4 @@ def fit_transform(self, X, y=None): X_t = self.transform(X, y) except MethodPropertyNotFoundError as e: raise e - - # return _convert_to_woodwork_structure(pd.DataFrame(X_t, columns=X.columns, index=X.index)) return _convert_to_woodwork_structure(X_t) diff --git a/evalml/tests/component_tests/test_baseline_classifier.py b/evalml/tests/component_tests/test_baseline_classifier.py index 3333e49fed..593c241ac7 100644 --- a/evalml/tests/component_tests/test_baseline_classifier.py +++ b/evalml/tests/component_tests/test_baseline_classifier.py @@ -27,12 +27,12 @@ def test_baseline_y_is_None(X_y_binary): @pytest.mark.parametrize('data_type', ['pd', 'ww']) -def test_baseline_binary_mode(data_type, X_y_binary): +def test_baseline_binary_mode(data_type, make_data_type): X = pd.DataFrame({'one': [1, 2, 3, 4], 'two': [2, 3, 4, 5], 'three': [1, 2, 3, 4]}) y = pd.Series([10, 11, 10, 10]) - if data_type == 'ww': - X = ww.DataTable(X) - y = ww.DataColumn(y) + X = make_data_type(data_type, X) + y = make_data_type(data_type, y) + clf = BaselineClassifier(strategy="mode") clf.fit(X, y) assert clf.classes_ == [10, 11] diff --git a/evalml/tests/component_tests/test_datetime_featurizer.py b/evalml/tests/component_tests/test_datetime_featurizer.py index 5294cdfc0e..50e93e22b5 100644 --- a/evalml/tests/component_tests/test_datetime_featurizer.py +++ b/evalml/tests/component_tests/test_datetime_featurizer.py @@ -1,6 +1,7 @@ import numpy as np import pandas as pd import pytest +from pandas.testing import assert_frame_equal from evalml.pipelines.components import DateTimeFeaturizer @@ -30,7 +31,7 @@ def test_datetime_featurizer_encodes_as_ints(): feature_names = {'date_month': {'April': 3, 'March': 2, 'July': 6, 'August': 7, 'January': 0}, 'date_day_of_week': {'Sunday': 0, 'Wednesday': 3, 'Tuesday': 2, 'Monday': 1, 'Friday': 5} } - pd.testing.assert_frame_equal(expected, X_transformed_df.to_dataframe()) + assert_frame_equal(expected, X_transformed_df.to_dataframe()) assert dt.get_feature_names() == feature_names # Test that changing encode_as_categories to True only changes the dtypes but not the values @@ -39,8 +40,7 @@ def test_datetime_featurizer_encodes_as_ints(): expected["date_month"] = pd.Categorical([3, 2, 6, 7, 0]) expected["date_day_of_week"] = pd.Categorical([0, 3, 2, 1, 5]) - # import pdb; pdb.set_trace() - pd.testing.assert_frame_equal(expected, X_transformed_df.to_dataframe()) + assert_frame_equal(expected, X_transformed_df.to_dataframe()) assert dt_with_cats.get_feature_names() == feature_names # Test that sequential calls to the same DateTimeFeaturizer work as expected by using the first dt we defined @@ -50,7 +50,7 @@ def test_datetime_featurizer_encodes_as_ints(): "date_month": pd.Series([3, 2, 7], dtype="Int64"), "date_day_of_week": pd.Series([5, 3, 1], dtype="Int64"), "date_hour": pd.Series([0, 0, 0], dtype="Int64")}) - pd.testing.assert_frame_equal(expected, X_transformed_df.to_dataframe()) + assert_frame_equal(expected, X_transformed_df.to_dataframe()) assert dt.get_feature_names() == {'date_month': {'April': 3, 'March': 2, 'August': 7}, 'date_day_of_week': {'Friday': 5, 'Wednesday': 3, 'Monday': 1}} @@ -109,7 +109,7 @@ def test_datetime_featurizer_no_features_to_extract(): expected["numerical"] = 
expected["numerical"].astype("Int64") datetime_transformer.fit(X) transformed = datetime_transformer.transform(X).to_dataframe() - pd.testing.assert_frame_equal(expected, transformed) + assert_frame_equal(expected, transformed) assert datetime_transformer.get_feature_names() == {} @@ -128,7 +128,7 @@ def test_datetime_featurizer_no_datetime_cols(): expected = X.astype("Int64") datetime_transformer.fit(X) transformed = datetime_transformer.transform(X).to_dataframe() - pd.testing.assert_frame_equal(expected, transformed) + assert_frame_equal(expected, transformed) assert datetime_transformer.get_feature_names() == {} diff --git a/evalml/tests/component_tests/test_featuretools.py b/evalml/tests/component_tests/test_featuretools.py index 1807dbe21e..74437be40d 100644 --- a/evalml/tests/component_tests/test_featuretools.py +++ b/evalml/tests/component_tests/test_featuretools.py @@ -4,6 +4,7 @@ import pandas as pd import pytest import woodwork as ww +from pandas.testing import assert_frame_equal from evalml.pipelines.components import DFSTransformer @@ -27,13 +28,14 @@ def test_numeric_columns(X_y_multi): @patch('evalml.pipelines.components.transformers.preprocessing.featuretools.dfs') @patch('evalml.pipelines.components.transformers.preprocessing.featuretools.calculate_feature_matrix') -def test_index(mock_dfs, mock_calculate_feature_matrix, X_y_multi): +def test_featuretools_index(mock_calculate_feature_matrix, mock_dfs, X_y_multi): X, y = X_y_multi X_pd = pd.DataFrame(X) X_new_index = X_pd.copy() index = [i for i in range(len(X))] new_index = [i * 2 for i in index] X_new_index['index'] = new_index + mock_calculate_feature_matrix.return_value = pd.DataFrame({}) # check if _make_entity_set keeps the intended index feature = DFSTransformer() @@ -61,13 +63,13 @@ def test_transform(X_y_binary, X_y_multi, X_y_regression): X_pd.columns = X_pd.columns.astype(str) es = ft.EntitySet() es = es.entity_from_dataframe(entity_id="X", dataframe=X_pd, index='index', make_index=True) - matrix, features = ft.dfs(entityset=es, target_entity="X") + feature_matrix, features = ft.dfs(entityset=es, target_entity="X") feature = DFSTransformer() feature.fit(X) - X_feature_matrix = feature.transform(X) + X_t = feature.transform(X) - pd.testing.assert_frame_equal(matrix, X_feature_matrix) + assert_frame_equal(feature_matrix, X_t.to_dataframe()) assert features == feature.features feature.fit(X, y) @@ -89,10 +91,10 @@ def test_transform_subset(X_y_binary, X_y_multi, X_y_regression): es = ft.EntitySet() es = es.entity_from_dataframe(entity_id="X", dataframe=X_transform, index='index', make_index=True) - matrix, features = ft.dfs(entityset=es, target_entity="X") + feature_matrix, features = ft.dfs(entityset=es, target_entity="X") feature = DFSTransformer() feature.fit(X_fit) - X_feature_matrix = feature.transform(X_transform) + X_t = feature.transform(X_transform) - pd.testing.assert_frame_equal(matrix, X_feature_matrix) + assert_frame_equal(feature_matrix, X_t.to_dataframe()) From c99808b98c37bcb164a97de01ad2b7a4f292c200 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Mon, 11 Jan 2021 15:15:17 -0500 Subject: [PATCH 14/98] update col selector transformer --- .../transformers/column_selectors.py | 11 --- .../preprocessing/featuretools.py | 2 +- .../components/transformers/transformer.py | 2 - .../test_baseline_classifier.py | 1 - .../test_column_selector_transformers.py | 86 ++++++++----------- 5 files changed, 36 insertions(+), 66 deletions(-) diff --git a/evalml/pipelines/components/transformers/column_selectors.py 
b/evalml/pipelines/components/transformers/column_selectors.py index a78e0200be..0fbea2c0de 100644 --- a/evalml/pipelines/components/transformers/column_selectors.py +++ b/evalml/pipelines/components/transformers/column_selectors.py @@ -54,7 +54,6 @@ def fit(self, X, y=None): Returns: self """ - self._check_input_for_columns(X) return self @@ -68,16 +67,6 @@ def transform(self, X, y=None): return _convert_to_woodwork_structure(cols) def fit_transform(self, X, y=None): - """Fit transformer to data, then transform data. - - Arguments: - X (pd.DataFrame): Data to transform. - y (pd.Series, optional): Targets. - - Returns: - ww.DataTable: Transformed X. - """ - # transform method already calls fit under the hood. self.fit(X, y) return self.transform(X, y) diff --git a/evalml/pipelines/components/transformers/preprocessing/featuretools.py b/evalml/pipelines/components/transformers/preprocessing/featuretools.py index ecc1d45263..ebcea8fa5d 100644 --- a/evalml/pipelines/components/transformers/preprocessing/featuretools.py +++ b/evalml/pipelines/components/transformers/preprocessing/featuretools.py @@ -46,7 +46,7 @@ def fit(self, X, y=None): Arguments: X (ww.DataTable, pd.DataFrame, np.array): The input data to transform, of shape [n_samples, n_features] y (ww.DataColumn, pd.Series, np.ndarray, optional): The target training data of length [n_samples] - + Returns: self """ diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index 71eee3d332..14616ec06f 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -1,5 +1,3 @@ -import pandas as pd - from evalml.exceptions import MethodPropertyNotFoundError from evalml.model_family import ModelFamily from evalml.pipelines.components import ComponentBase diff --git a/evalml/tests/component_tests/test_baseline_classifier.py b/evalml/tests/component_tests/test_baseline_classifier.py index 593c241ac7..ddd3c02b43 100644 --- a/evalml/tests/component_tests/test_baseline_classifier.py +++ b/evalml/tests/component_tests/test_baseline_classifier.py @@ -1,7 +1,6 @@ import numpy as np import pandas as pd import pytest -import woodwork as ww from evalml.model_family import ModelFamily from evalml.pipelines.components import BaselineClassifier diff --git a/evalml/tests/component_tests/test_column_selector_transformers.py b/evalml/tests/component_tests/test_column_selector_transformers.py index a625d6fa31..2cec634b43 100644 --- a/evalml/tests/component_tests/test_column_selector_transformers.py +++ b/evalml/tests/component_tests/test_column_selector_transformers.py @@ -1,6 +1,7 @@ import numpy as np import pandas as pd import pytest +from pandas.testing import assert_frame_equal from evalml.pipelines.components import DropColumns, SelectColumns @@ -24,63 +25,63 @@ def test_column_transformer_init(class_to_test): def test_column_transformer_empty_X(class_to_test): X = pd.DataFrame() transformer = class_to_test(columns=[]) - assert transformer.transform(X).equals(X) + assert_frame_equal(X, transformer.transform(X).to_dataframe()) transformer = class_to_test(columns=[]) - assert transformer.fit_transform(X).equals(X) + assert_frame_equal(X, transformer.fit_transform(X).to_dataframe()) transformer = class_to_test(columns=["not in data"]) with pytest.raises(ValueError, match="'not in data' not found in input data"): transformer.fit(X) transformer = class_to_test(columns=list(X.columns)) - assert 
transformer.transform(X).empty + assert transformer.transform(X).to_dataframe().empty @pytest.mark.parametrize("class_to_test,checking_functions", - [(DropColumns, [lambda df, X: df.equals(X), - lambda df, X: df.equals(X), - lambda df, X: df.equals(X.drop(columns=["one"])), - lambda df, X: df.empty]), - (SelectColumns, [lambda df, X: df.empty, - lambda df, X: df.empty, - lambda df, X: df.equals(X[["one"]]), - lambda df, X: df.equals(X)]) + [(DropColumns, [lambda X, X_t: X_t.equals(X.astype("Int64")), + lambda X, X_t: X_t.equals(X.astype("Int64")), + lambda X, X_t: X_t.equals(X.drop(columns=["one"]).astype("Int64")), + lambda X, X_t: X_t.empty]), + (SelectColumns, [lambda X, X_t: X_t.empty, + lambda X, X_t: X_t.empty, + lambda X, X_t: X_t.equals(X[["one"]].astype("Int64")), + lambda X, X_t: X_t.equals(X.astype("Int64"))]) ]) def test_column_transformer_transform(class_to_test, checking_functions): X = pd.DataFrame({'one': [1, 2, 3, 4], 'two': [2, 3, 4, 5], 'three': [1, 2, 3, 4]}) check1, check2, check3, check4 = checking_functions transformer = class_to_test(columns=None) - assert check1(transformer.transform(X), X) + assert check1(X, transformer.transform(X).to_dataframe()) transformer = class_to_test(columns=[]) - assert check2(transformer.transform(X), X) + assert check2(X, transformer.transform(X).to_dataframe()) transformer = class_to_test(columns=["one"]) - assert check3(transformer.transform(X), X) + assert check3(X, transformer.transform(X).to_dataframe()) transformer = class_to_test(columns=list(X.columns)) - assert check4(transformer.transform(X), X) + assert check4(X, transformer.transform(X).to_dataframe()) @pytest.mark.parametrize("class_to_test,checking_functions", - [(DropColumns, [lambda df, X: df.equals(X), - lambda df, X: df.equals(X.drop(columns=["one"])), - lambda df, X: df.empty]), - (SelectColumns, [lambda df, X: df.empty, - lambda df, X: df.equals(X[["one"]]), - lambda df, X: df.equals(X)]) + [(DropColumns, [lambda X, X_t: X_t.equals(X.astype("Int64")), + lambda X, X_t: X_t.equals(X.drop(columns=["one"]).astype("Int64")), + lambda X, X_t: X_t.empty]), + (SelectColumns, [lambda X, X_t: X_t.empty, + lambda X, X_t: X_t.equals(X[["one"]].astype("Int64")), + lambda X, X_t: X_t.equals(X.astype("Int64"))]) ]) def test_column_transformer_fit_transform(class_to_test, checking_functions): X = pd.DataFrame({'one': [1, 2, 3, 4], 'two': [2, 3, 4, 5], 'three': [1, 2, 3, 4]}) check1, check2, check3 = checking_functions - assert check1(class_to_test(columns=[]).fit_transform(X), X) + assert check1(X, class_to_test(columns=[]).fit_transform(X).to_dataframe()) - assert check2(class_to_test(columns=["one"]).fit_transform(X), X) + assert check2(X, class_to_test(columns=["one"]).fit_transform(X).to_dataframe()) - assert check3(class_to_test(columns=list(X.columns)).fit_transform(X), X) + assert check3(X, class_to_test(columns=list(X.columns)).fit_transform(X).to_dataframe()) @pytest.mark.parametrize("class_to_test", [DropColumns, SelectColumns]) @@ -105,39 +106,22 @@ def test_drop_column_transformer_input_invalid_col_name(class_to_test): @pytest.mark.parametrize("class_to_test,answers", - [(DropColumns, [np.array([[0, 2, 3], [4, 6, 7], [8, 10, 11]]), - np.array([[], [], []]), - np.arange(12).reshape(3, 4)]), - (SelectColumns, [np.array([[1], [5], [9]]), - np.arange(12).reshape(3, 4), - np.array([[], [], []])]) + [(DropColumns, [pd.DataFrame([[0, 2, 3], [4, 6, 7], [8, 10, 11]], columns=[0, 2, 3], dtype="Int64"), + pd.DataFrame([[], [], []], dtype="Int64"), + 
pd.DataFrame(np.arange(12).reshape(3, 4), dtype="Int64")]), + (SelectColumns, [pd.DataFrame([[1], [5], [9]], columns=[1], dtype="Int64"), + pd.DataFrame(np.arange(12).reshape(3, 4), dtype="Int64"), + pd.DataFrame([[], [], []], dtype="Int64")]) ]) -def test_column_transformer_numpy(class_to_test, answers): +def test_column_transformer_int_col_names(class_to_test, answers): X = np.arange(12).reshape(3, 4) answer1, answer2, answer3 = answers transformer = class_to_test(columns=[1]) - np.testing.assert_allclose(transformer.transform(X).values, answer1) + assert_frame_equal(answer1, transformer.transform(X).to_dataframe()) transformer = class_to_test(columns=[0, 1, 2, 3]) - np.testing.assert_allclose(transformer.transform(X).values, answer2) + assert_frame_equal(answer2, transformer.transform(X).to_dataframe()) transformer = class_to_test(columns=[]) - np.testing.assert_allclose(transformer.transform(X).values, answer3) - - -@pytest.mark.parametrize("class_to_test,answers", - [(DropColumns, [np.array([[0, 2, 3], [4, 6, 7], [8, 10, 11]]), - np.array([[], [], []])]), - (SelectColumns, [np.array([[1], [5], [9]]), - np.arange(12).reshape(3, 4)]) - ]) -def test_column_transformer_int_col_names(class_to_test, answers): - X = np.arange(12).reshape(3, 4) - answer1, answer2 = answers - - transformer = class_to_test(columns=[1]) - np.testing.assert_allclose(transformer.transform(X).values, answer1) - - transformer = class_to_test(columns=[0, 1, 2, 3]) - np.testing.assert_allclose(transformer.transform(X).values, answer2) + assert_frame_equal(answer3, transformer.transform(X).to_dataframe()) From 704c1c42bc89752de56ace925607fef8d19125f5 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Mon, 11 Jan 2021 16:07:34 -0500 Subject: [PATCH 15/98] update baseline tests --- .../test_baseline_classifier.py | 55 ++++++++++++++----- 1 file changed, 41 insertions(+), 14 deletions(-) diff --git a/evalml/tests/component_tests/test_baseline_classifier.py b/evalml/tests/component_tests/test_baseline_classifier.py index ddd3c02b43..b8d61d0963 100644 --- a/evalml/tests/component_tests/test_baseline_classifier.py +++ b/evalml/tests/component_tests/test_baseline_classifier.py @@ -1,6 +1,7 @@ import numpy as np import pandas as pd import pytest +from pandas.testing import assert_frame_equal, assert_series_equal from evalml.model_family import ModelFamily from evalml.pipelines.components import BaselineClassifier @@ -35,11 +36,14 @@ def test_baseline_binary_mode(data_type, make_data_type): clf = BaselineClassifier(strategy="mode") clf.fit(X, y) assert clf.classes_ == [10, 11] - np.testing.assert_allclose(clf.predict(X), np.array([10] * X.shape[0])) + predictions = clf.predict(X) + assert_series_equal(pd.Series(np.array([10] * X.shape[0]), dtype="Int64"), predictions.to_series()) + predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (X.shape[0], 2) expected_predicted_proba = pd.DataFrame({10: [1., 1., 1., 1.], 11: [0., 0., 0., 0.]}) - pd.testing.assert_frame_equal(expected_predicted_proba, predicted_proba) + assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -49,10 +53,15 @@ def test_baseline_binary_random(X_y_binary): clf = BaselineClassifier(strategy="random", random_state=0) clf.fit(X, y) assert clf.classes_ == [0, 1] - np.testing.assert_allclose(clf.predict(X), get_random_state(0).choice(np.unique(y), len(X))) + + predictions = clf.predict(X) + 
assert_series_equal(pd.Series(get_random_state(0).choice(np.unique(y), len(X)), dtype="Int64"), predictions.to_series()) + predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 2) - np.testing.assert_allclose(predicted_proba, np.array([[0.5 for i in range(len(values))]] * len(X))) + expected_predicted_proba = pd.DataFrame(np.array([[0.5 for i in range(len(values))]] * len(X))) + assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -64,10 +73,14 @@ def test_baseline_binary_random_weighted(X_y_binary): clf = BaselineClassifier(strategy="random_weighted", random_state=0) clf.fit(X, y) assert clf.classes_ == [0, 1] - np.testing.assert_allclose(clf.predict(X), get_random_state(0).choice(np.unique(y), len(X), p=percent_freq)) + predictions = clf.predict(X) + assert_series_equal(pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64"), predictions.to_series()) + predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 2) - np.testing.assert_allclose(predicted_proba, np.array([[percent_freq[i] for i in range(len(values))]] * len(X))) + expected_predicted_proba = pd.DataFrame(np.array([[percent_freq[i] for i in range(len(values))]] * len(X))) + assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -77,11 +90,14 @@ def test_baseline_multiclass_mode(): clf = BaselineClassifier(strategy="mode") clf.fit(X, y) assert clf.classes_ == [10, 11, 12] - np.testing.assert_allclose(clf.predict(X), np.array([11] * len(X))) + predictions = clf.predict(X) + assert_series_equal(pd.Series(np.array([11] * len(X)), dtype="Int64"), predictions.to_series()) + predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) expected_predicted_proba = pd.DataFrame({10: [0., 0., 0., 0.], 11: [1., 1., 1., 1.], 12: [0., 0., 0., 0.]}) - pd.testing.assert_frame_equal(expected_predicted_proba, predicted_proba) + assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -91,10 +107,13 @@ def test_baseline_multiclass_random(X_y_multi): clf = BaselineClassifier(strategy="random", random_state=0) clf.fit(X, y) assert clf.classes_ == [0, 1, 2] - np.testing.assert_allclose(clf.predict(X), get_random_state(0).choice(np.unique(y), len(X))) + predictions = clf.predict(X) + assert_series_equal(pd.Series(get_random_state(0).choice(np.unique(y), len(X)), dtype="Int64"), predictions.to_series()) + predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) - np.testing.assert_allclose(predicted_proba, np.array([[1. / 3 for i in range(len(values))]] * len(X))) + assert_frame_equal(pd.DataFrame(np.array([[1. 
/ 3 for i in range(len(values))]] * len(X))), predicted_proba.to_dataframe())
     np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1]))


@@ -106,10 +125,14 @@ def test_baseline_multiclass_random_weighted(X_y_multi):
     clf = BaselineClassifier(strategy="random_weighted", random_state=0)
     clf.fit(X, y)
     assert clf.classes_ == [0, 1, 2]
-    np.testing.assert_allclose(clf.predict(X), get_random_state(0).choice(np.unique(y), len(X), p=percent_freq))
+
+    predictions = clf.predict(X)
+    assert_series_equal(pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64"), predictions.to_series())
+
     predicted_proba = clf.predict_proba(X)
     assert predicted_proba.shape == (len(X), 3)
-    np.testing.assert_allclose(predicted_proba, np.array([[percent_freq[i] for i in range(len(values))]] * len(X)))
+    assert_frame_equal(pd.DataFrame(np.array([[percent_freq[i] for i in range(len(values))]] * len(X))), predicted_proba.to_dataframe())
+
     np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1]))


@@ -119,8 +143,11 @@ def test_baseline_no_mode():
     clf = BaselineClassifier()
     clf.fit(X, y)
     assert clf.classes_ == [0, 1, 2]
-    np.testing.assert_allclose(clf.predict(X), np.array([0] * len(X)))
+    predictions = clf.predict(X)
+    assert_series_equal(pd.Series([0] * len(X), dtype="Int64"), predictions.to_series())
+
     predicted_proba = clf.predict_proba(X)
     assert predicted_proba.shape == (len(X), 3)
-    np.testing.assert_allclose(predicted_proba, np.array([[1.0 if i == 0 else 0.0 for i in range(3)]] * len(X)))
+    assert_frame_equal(pd.DataFrame(np.array([[1.0 if i == 0 else 0.0 for i in range(3)]] * len(X))), predicted_proba.to_dataframe())
+
     np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1]))
From c348d793182c67a3d33ae2cb5772907e7787f4ec Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Mon, 11 Jan 2021 16:30:01 -0500
Subject: [PATCH 16/98] update baseline regressor

---
 .../estimators/regressors/baseline_regressor.py          | 3 ++-
 evalml/tests/component_tests/test_baseline_regressor.py | 8 ++++++--
 2 files changed, 8 insertions(+), 3 deletions(-)

diff --git a/evalml/pipelines/components/estimators/regressors/baseline_regressor.py b/evalml/pipelines/components/estimators/regressors/baseline_regressor.py
index 2b46addd99..e0f7984612 100644
--- a/evalml/pipelines/components/estimators/regressors/baseline_regressor.py
+++ b/evalml/pipelines/components/estimators/regressors/baseline_regressor.py
@@ -57,7 +57,8 @@ def fit(self, X, y=None):
     def predict(self, X):
         X = _convert_to_woodwork_structure(X)
         X = _convert_woodwork_types_wrapper(X.to_dataframe())
-        return pd.Series([self._prediction_value] * len(X))
+        predictions = pd.Series([self._prediction_value] * len(X))
+        return _convert_to_woodwork_structure(predictions)

     @property
     def feature_importance(self):
diff --git a/evalml/tests/component_tests/test_baseline_regressor.py b/evalml/tests/component_tests/test_baseline_regressor.py
index 4e4b9ea4e0..e65b60a26e 100644
--- a/evalml/tests/component_tests/test_baseline_regressor.py
+++ b/evalml/tests/component_tests/test_baseline_regressor.py
@@ -1,5 +1,7 @@
 import numpy as np
+import pandas as pd
 import pytest
+from pandas.testing import assert_series_equal

 from evalml.model_family import ModelFamily
 from evalml.pipelines.components import BaselineRegressor
@@ -27,7 +29,8 @@ def
test_baseline_mean(X_y_regression): mean = y.mean() clf = BaselineRegressor() clf.fit(X, y) - np.testing.assert_allclose(clf.predict(X), np.array([mean] * len(X))) + predictions = clf.predict(X) + assert_series_equal(pd.Series([mean] * len(X)), predictions.to_series()) np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -36,5 +39,6 @@ def test_baseline_median(X_y_regression): median = np.median(y) clf = BaselineRegressor(strategy="median") clf.fit(X, y) - np.testing.assert_allclose(clf.predict(X), np.array([median] * len(X))) + predictions = clf.predict(X) + assert_series_equal(pd.Series([median] * len(X)), predictions.to_series()) np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) From 231523b70ae2f02dbb7dc4b90fbf231909735977 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Mon, 11 Jan 2021 18:31:56 -0500 Subject: [PATCH 17/98] update target encoder --- evalml/pipelines/component_graph.py | 1 + .../classifiers/catboost_classifier.py | 4 +- .../classifiers/lightgbm_classifier.py | 5 +- .../regressors/catboost_regressor.py | 4 +- .../time_series_baseline_regressor.py | 2 +- .../component_tests/test_target_encoder.py | 56 +++++++------------ .../test_regression.py | 16 ++++++ 7 files changed, 46 insertions(+), 42 deletions(-) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 2c69eca112..74fc488f5c 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -219,6 +219,7 @@ def _consolidate_inputs(x_inputs, y_input, X, y): Returns: pd.DataFrame, pd.Series: The X and y transformed values to evaluate a component with """ + if len(x_inputs) == 0: return_x = X else: diff --git a/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py b/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py index 8c9ab2478d..ab979654a6 100644 --- a/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py +++ b/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py @@ -70,8 +70,8 @@ def fit(self, X, y=None): if y.nunique() <= 2: self._label_encoder = LabelEncoder() y = pd.Series(self._label_encoder.fit_transform(y)) - model = self._component_obj.fit(X, y, silent=True, cat_features=cat_cols) - return model + self._component_obj.fit(X, y, silent=True, cat_features=cat_cols) + return self def predict(self, X): X = _convert_to_woodwork_structure(X) diff --git a/evalml/pipelines/components/estimators/classifiers/lightgbm_classifier.py b/evalml/pipelines/components/estimators/classifiers/lightgbm_classifier.py index 3e62898ac1..a15125433d 100644 --- a/evalml/pipelines/components/estimators/classifiers/lightgbm_classifier.py +++ b/evalml/pipelines/components/estimators/classifiers/lightgbm_classifier.py @@ -108,8 +108,9 @@ def predict(self, X): predictions = super().predict(X_encoded) if self._label_encoder: predictions = pd.Series(self._label_encoder.inverse_transform(predictions.astype(np.int64))) - return predictions + return _convert_to_woodwork_structure(predictions) def predict_proba(self, X): X_encoded = self._encode_categories(X) - return super().predict_proba(X_encoded) + prediction_proba = super().predict_proba(X_encoded) + return _convert_to_woodwork_structure(prediction_proba) diff --git a/evalml/pipelines/components/estimators/regressors/catboost_regressor.py b/evalml/pipelines/components/estimators/regressors/catboost_regressor.py index 505cff948a..9ddda1c733 100644 --- 
a/evalml/pipelines/components/estimators/regressors/catboost_regressor.py +++ b/evalml/pipelines/components/estimators/regressors/catboost_regressor.py @@ -62,8 +62,8 @@ def fit(self, X, y=None): y = _convert_to_woodwork_structure(y) y = _convert_woodwork_types_wrapper(y.to_series()) - model = self._component_obj.fit(X, y, silent=True, cat_features=cat_cols) - return model + self._component_obj.fit(X, y, silent=True, cat_features=cat_cols) + return self @property def feature_importance(self): diff --git a/evalml/pipelines/components/estimators/regressors/time_series_baseline_regressor.py b/evalml/pipelines/components/estimators/regressors/time_series_baseline_regressor.py index 812560b157..1b599a4994 100644 --- a/evalml/pipelines/components/estimators/regressors/time_series_baseline_regressor.py +++ b/evalml/pipelines/components/estimators/regressors/time_series_baseline_regressor.py @@ -61,7 +61,7 @@ def predict(self, X, y=None): if self.gap == 0: y = y.shift(periods=1) - return y + return _convert_to_woodwork_structure(y) @property def feature_importance(self): diff --git a/evalml/tests/component_tests/test_target_encoder.py b/evalml/tests/component_tests/test_target_encoder.py index 433ccd56f0..c20d9d9f64 100644 --- a/evalml/tests/component_tests/test_target_encoder.py +++ b/evalml/tests/component_tests/test_target_encoder.py @@ -3,12 +3,11 @@ import numpy as np import pandas as pd import pytest +from pandas.testing import assert_frame_equal from pytest import importorskip from evalml.exceptions import ComponentNotYetFittedError -from evalml.pipelines import RegressionPipeline from evalml.pipelines.components import TargetEncoder -from evalml.preprocessing import split_data importorskip('category_encoders', reason='Skipping test because category_encoders not installed') @@ -58,7 +57,7 @@ def test_null_values_in_dataframe(): 'col_2': [0.526894, 0.526894, 0.526894, 0.6, 0.526894], 'col_3': [0.6, 0.6, 0.6, 0.6, 0.6, ]}) - pd.testing.assert_frame_equal(X_t, X_expected) + assert_frame_equal(X_expected, X_t.to_dataframe()) encoder = TargetEncoder(handle_missing='return_nan') encoder.fit(X, y) @@ -66,7 +65,7 @@ def test_null_values_in_dataframe(): X_expected = pd.DataFrame({'col_1': [0.6, 0.6, 0.6, 0.6, np.nan], 'col_2': [0.526894, 0.526894, 0.526894, 0.6, 0.526894], 'col_3': [0.6, 0.6, 0.6, 0.6, 0.6, ]}) - pd.testing.assert_frame_equal(X_t, X_expected) + assert_frame_equal(X_expected, X_t.to_dataframe()) encoder = TargetEncoder(handle_missing='error') with pytest.raises(ValueError, match='Columns to be encoded can not contain null'): @@ -77,19 +76,20 @@ def test_cols(): X = pd.DataFrame({'col_1': [1, 2, 1, 1, 2], 'col_2': ['2', '1', '1', '1', '1'], 'col_3': ["a", "a", "a", "a", "a"]}) + X_expected = X.astype({'col_1': 'Int64', 'col_2': 'category', 'col_3': 'category'}) y = pd.Series([0, 1, 1, 1, 0]) encoder = TargetEncoder(cols=[]) encoder.fit(X, y) X_t = encoder.transform(X) - pd.testing.assert_frame_equal(X, X_t) + assert_frame_equal(X_expected, X_t.to_dataframe()) encoder = TargetEncoder(cols=['col_2']) encoder.fit(X, y) X_t = encoder.transform(X) - X_expected = pd.DataFrame({'col_1': [1, 2, 1, 1, 2], + X_expected = pd.DataFrame({'col_1': pd.Series([1, 2, 1, 1, 2], dtype="Int64"), 'col_2': [0.60000, 0.742886, 0.742886, 0.742886, 0.742886], - 'col_3': ["a", "a", "a", "a", "a"]}) - pd.testing.assert_frame_equal(X_t, X_expected, check_less_precise=True) + 'col_3': pd.Series(["a", "a", "a", "a", "a"], dtype="category")}) + assert_frame_equal(X_expected, X_t.to_dataframe(), 
check_less_precise=True) encoder = TargetEncoder(cols=['col_2', 'col_3']) encoder.fit(X, y) @@ -97,7 +97,7 @@ def test_cols(): encoder2 = TargetEncoder() encoder2.fit(X, y) X_t2 = encoder2.transform(X) - pd.testing.assert_frame_equal(X_t, X_t2) + assert_frame_equal(X_t.to_dataframe(), X_t2.to_dataframe()) def test_transform(): @@ -108,10 +108,10 @@ def test_transform(): encoder = TargetEncoder() encoder.fit(X, y) X_t = encoder.transform(X) - X_expected = pd.DataFrame({'col_1': [1, 2, 1, 1, 2], + X_expected = pd.DataFrame({'col_1': pd.Series([1, 2, 1, 1, 2], dtype="Int64"), 'col_2': [0.6, 0.65872, 0.6, 0.65872, 0.65872], 'col_3': [0.504743, 0.504743, 0.504743, 0.6, 0.504743]}) - pd.testing.assert_frame_equal(X_t, X_expected) + assert_frame_equal(X_expected, X_t.to_dataframe()) def test_smoothing(): @@ -123,26 +123,26 @@ def test_smoothing(): encoder = TargetEncoder(smoothing=1) encoder.fit(X, y) X_t = encoder.transform(X) - X_expected = pd.DataFrame({'col_1': [1, 2, 1, 1, 2], - 'col_2': [2, 1, 1, 1, 1], + X_expected = pd.DataFrame({'col_1': pd.Series([1, 2, 1, 1, 2], dtype="Int64"), + 'col_2': pd.Series([2, 1, 1, 1, 1], dtype="Int64"), 'col_3': [0.742886, 0.742886, 0.742886, 0.742886, 0.6]}) - pd.testing.assert_frame_equal(X_t, X_expected) + assert_frame_equal(X_expected, X_t.to_dataframe()) encoder = TargetEncoder(smoothing=10) encoder.fit(X, y) X_t = encoder.transform(X) - X_expected = pd.DataFrame({'col_1': [1, 2, 1, 1, 2], - 'col_2': [2, 1, 1, 1, 1], + X_expected = pd.DataFrame({'col_1': pd.Series([1, 2, 1, 1, 2], dtype="Int64"), + 'col_2': pd.Series([2, 1, 1, 1, 1], dtype="Int64"), 'col_3': [0.686166, 0.686166, 0.686166, 0.686166, 0.6]}) - pd.testing.assert_frame_equal(X_t, X_expected) + assert_frame_equal(X_expected, X_t.to_dataframe()) encoder = TargetEncoder(smoothing=100) encoder.fit(X, y) X_t = encoder.transform(X) - X_expected = pd.DataFrame({'col_1': [1, 2, 1, 1, 2], - 'col_2': [2, 1, 1, 1, 1], + X_expected = pd.DataFrame({'col_1': pd.Series([1, 2, 1, 1, 2], dtype="Int64"), + 'col_2': pd.Series([2, 1, 1, 1, 1], dtype="Int64"), 'col_3': [0.676125, 0.676125, 0.676125, 0.676125, 0.6]}) - pd.testing.assert_frame_equal(X_t, X_expected) + assert_frame_equal(X_expected, X_t.to_dataframe()) def test_get_feature_names(): @@ -157,20 +157,6 @@ def test_get_feature_names(): np.testing.assert_array_equal(encoder.get_feature_names(), np.array(['col_1', 'col_2', 'col_3'])) -def test_custom_indices(): - # custom regression pipeline - class MyTargetPipeline(RegressionPipeline): - component_graph = ['Imputer', 'Target Encoder', 'Linear Regressor'] - custom_name = "Target Pipeline" - - X = pd.DataFrame({"a": ["a", "b", "a", "a", "a", "c", "c", "c"], "b": [0, 1, 1, 1, 1, 1, 0, 1]}) - y = pd.Series([0, 0, 0, 1, 0, 1, 0, 0], index=[7, 2, 1, 4, 5, 3, 6, 8]) - - x1, x2, y1, y2 = split_data(X, y, problem_type='binary') - tp = MyTargetPipeline({}) - tp.fit(x2, y2) - - @patch('evalml.pipelines.components.transformers.transformer.Transformer.fit') def test_pandas_numpy(mock_fit, X_y_binary): X, y = X_y_binary @@ -180,7 +166,7 @@ def test_pandas_numpy(mock_fit, X_y_binary): X_t = pd.DataFrame(X).reset_index(drop=True, inplace=False) encoder.fit(X, y) - pd.testing.assert_frame_equal(mock_fit.call_args[0][0], X_t) + assert_frame_equal(mock_fit.call_args[0][0], X_t) X_numpy = X.to_numpy() encoder.fit(X_numpy, y) diff --git a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py index 42c3c07716..03726c60ca 100644 --- 
a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py +++ b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py @@ -2,6 +2,8 @@ import pytest from evalml.demos import load_breast_cancer, load_diabetes, load_wine +from evalml.pipelines import RegressionPipeline +from evalml.preprocessing import split_data @pytest.mark.parametrize("target_type", ["category", "string", "bool"]) @@ -22,3 +24,17 @@ def test_woodwork_regression_pipeline(linear_regression_pipeline_class): mock_regression_pipeline = linear_regression_pipeline_class(parameters={'Linear Regressor': {'n_jobs': 1}}) mock_regression_pipeline.fit(X, y) assert not pd.isnull(mock_regression_pipeline.predict(X)).any() + + +def test_custom_indices(): + # custom regression pipeline + class MyTargetPipeline(RegressionPipeline): + component_graph = ['Imputer', 'Target Encoder', 'Linear Regressor'] + custom_name = "Target Pipeline" + + X = pd.DataFrame({"a": ["a", "b", "a", "a", "a", "c", "c", "c"], "b": [0, 1, 1, 1, 1, 1, 0, 1]}) + y = pd.Series([0, 0, 0, 1, 0, 1, 0, 0], index=[7, 2, 1, 4, 5, 3, 6, 8]) + + x1, x2, y1, y2 = split_data(X, y, problem_type='binary') + tp = MyTargetPipeline({}) + tp.fit(x2, y2) From a93c8b34aef7ba89511bb91a8212069c87eda6ee Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Mon, 11 Jan 2021 21:20:22 -0500 Subject: [PATCH 18/98] update delayed feature transformer --- .../classifiers/xgboost_classifier.py | 11 +- .../regressors/xgboost_regressor.py | 6 +- .../transformers/preprocessing/__init__.py | 2 +- ...ries.py => delayed_feature_transformer.py} | 24 ++- .../test_delayed_features_transformer.py | 167 +++++++++--------- .../test_xgboost_classifier.py | 4 +- 6 files changed, 115 insertions(+), 99 deletions(-) rename evalml/pipelines/components/transformers/preprocessing/{time_series.py => delayed_feature_transformer.py} (80%) diff --git a/evalml/pipelines/components/estimators/classifiers/xgboost_classifier.py b/evalml/pipelines/components/estimators/classifiers/xgboost_classifier.py index 8b37388ae8..e1591c3a09 100644 --- a/evalml/pipelines/components/estimators/classifiers/xgboost_classifier.py +++ b/evalml/pipelines/components/estimators/classifiers/xgboost_classifier.py @@ -4,7 +4,10 @@ from evalml.pipelines.components.estimators import Estimator from evalml.problem_types import ProblemTypes from evalml.utils import get_random_seed, import_or_raise -from evalml.utils.gen_utils import _rename_column_names_to_numeric +from evalml.utils.gen_utils import ( + _convert_to_woodwork_structure, + _rename_column_names_to_numeric +) class XGBoostClassifier(Estimator): @@ -48,12 +51,14 @@ def fit(self, X, y=None): def predict(self, X): X = _rename_column_names_to_numeric(X) predictions = super().predict(X) + predictions = _convert_to_woodwork_structure(predictions) return predictions def predict_proba(self, X): X = _rename_column_names_to_numeric(X) - predictions = super().predict_proba(X) - return predictions + pred_proba = super().predict_proba(X) + pred_proba = _convert_to_woodwork_structure(pred_proba) + return pred_proba @property def feature_importance(self):
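
Aside on the _rename_column_names_to_numeric helper used in fit and predict above: XGBoost rejects feature names containing characters such as [, ] or <, which is what test_xgboost_feature_name_with_random_ascii further down exercises. A rough sketch of the idea only, with hypothetical column names, not the actual helper implementation:

    import pandas as pd

    # column names XGBoost would reject as feature names
    X = pd.DataFrame({"a<b": [1, 2], "c[0]": [3, 4]})
    # rename each column to its integer position before handing data to XGBoost
    X_renamed = X.rename(columns=dict(zip(X.columns, range(X.shape[1]))))

diff --git a/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py b/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py index 6d2e5b94b7..f354bf7bcc 100644 ---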
from evalml.problem_types import ProblemTypes from evalml.utils import get_random_seed, import_or_raise -from evalml.utils.gen_utils import _rename_column_names_to_numeric +from evalml.utils.gen_utils import ( + _convert_to_woodwork_structure, + _rename_column_names_to_numeric +) class XGBoostRegressor(Estimator): @@ -47,6 +50,7 @@ def fit(self, X, y=None): def predict(self, X): X = _rename_column_names_to_numeric(X) predictions = super().predict(X) + predictions = _convert_to_woodwork_structure(predictions) return predictions @property diff --git a/evalml/pipelines/components/transformers/preprocessing/__init__.py b/evalml/pipelines/components/transformers/preprocessing/__init__.py index 294e02c9a9..1224e23644 100644 --- a/evalml/pipelines/components/transformers/preprocessing/__init__.py +++ b/evalml/pipelines/components/transformers/preprocessing/__init__.py @@ -3,5 +3,5 @@ from .text_transformer import TextTransformer from .lsa import LSA from .text_featurizer import TextFeaturizer -from .time_series import DelayedFeatureTransformer +from .delayed_feature_transformer import DelayedFeatureTransformer from .featuretools import DFSTransformer diff --git a/evalml/pipelines/components/transformers/preprocessing/time_series.py b/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py similarity index 80% rename from evalml/pipelines/components/transformers/preprocessing/time_series.py rename to evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py index 1c61391675..8fbad18176 100644 --- a/evalml/pipelines/components/transformers/preprocessing/time_series.py +++ b/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py @@ -1,6 +1,10 @@ import pandas as pd from evalml.pipelines.components.transformers.transformer import Transformer +from evalml.utils.gen_utils import ( + _convert_to_woodwork_structure, + _convert_woodwork_types_wrapper +) class DelayedFeatureTransformer(Transformer): @@ -50,17 +54,19 @@ def transform(self, X, y=None): If y is not None, it will also compute the delayed values for the target variable. Arguments: - X (pd.DataFrame or None): Data to transform. None is expected when only the target variable is being used. - y (pd.Series, None): Target. + X (ww.DataTable, pd.DataFrame or None): Data to transform. None is expected when only the target variable is being used. + y (ww.DataColumn, pd.Series, or None): Target. Returns: - pd.DataFrame: Transformed X. + ww.DataTable: Transformed X. 
""" - # Normalize the data into pandas objects - if not isinstance(X, pd.DataFrame): - X = pd.DataFrame(X) - if y is not None and not isinstance(y, pd.Series): - y = pd.Series(y) + if X is None: + X = pd.DataFrame() + X = _convert_to_woodwork_structure(X) + X = _convert_woodwork_types_wrapper(X.to_dataframe()) + if y is not None: + y = _convert_to_woodwork_structure(y) + y = _convert_woodwork_types_wrapper(y.to_series()) if self.delay_features and not X.empty: X = X.assign(**{f"{col}_delay_{t}": X[col].shift(t) @@ -72,4 +78,4 @@ def transform(self, X, y=None): X = X.assign(**{f"target_delay_{t}": y.shift(t) for t in range(self.start_delay_for_target, self.max_delay + 1)}) - return X + return _convert_to_woodwork_structure(X) diff --git a/evalml/tests/component_tests/test_delayed_features_transformer.py b/evalml/tests/component_tests/test_delayed_features_transformer.py index 53f3ce0b22..7748f3b8fa 100644 --- a/evalml/tests/component_tests/test_delayed_features_transformer.py +++ b/evalml/tests/component_tests/test_delayed_features_transformer.py @@ -1,5 +1,6 @@ import pandas as pd import pytest +from pandas.testing import assert_frame_equal from evalml.pipelines import DelayedFeatureTransformer @@ -22,72 +23,72 @@ def test_delayed_features_transformer_init(): def test_delayed_feature_extractor_maxdelay3_gap1(delayed_features_data): X, y = delayed_features_data - answer = pd.DataFrame({"feature": X.feature, - "feature_delay_1": X.feature.shift(1), - "feature_delay_2": X.feature.shift(2), - "feature_delay_3": X.feature.shift(3), - "target_delay_0": y, - "target_delay_1": y.shift(1), - "target_delay_2": y.shift(2), - "target_delay_3": y.shift(3)}) + expected = pd.DataFrame({"feature": X.feature.astype("Int64"), + "feature_delay_1": X.feature.shift(1), + "feature_delay_2": X.feature.shift(2), + "feature_delay_3": X.feature.shift(3), + "target_delay_0": y.astype("Int64"), + "target_delay_1": y.shift(1), + "target_delay_2": y.shift(2), + "target_delay_3": y.shift(3)}) - pd.testing.assert_frame_equal(DelayedFeatureTransformer(max_delay=3, gap=1).fit_transform(X=X, y=y), answer) + assert_frame_equal(expected, DelayedFeatureTransformer(max_delay=3, gap=1).fit_transform(X=X, y=y).to_dataframe()) - answer_only_y = pd.DataFrame({"target_delay_0": y, - "target_delay_1": y.shift(1), - "target_delay_2": y.shift(2), - "target_delay_3": y.shift(3)}) - pd.testing.assert_frame_equal(DelayedFeatureTransformer(max_delay=3, gap=1).fit_transform(X=None, y=y), answer_only_y) + expected_only_y = pd.DataFrame({"target_delay_0": y.astype("Int64"), + "target_delay_1": y.shift(1), + "target_delay_2": y.shift(2), + "target_delay_3": y.shift(3)}) + assert_frame_equal(expected_only_y, DelayedFeatureTransformer(max_delay=3, gap=1).fit_transform(X=None, y=y).to_dataframe()) def test_delayed_feature_extractor_maxdelay5_gap1(delayed_features_data): X, y = delayed_features_data - answer = pd.DataFrame({"feature": X.feature, - "feature_delay_1": X.feature.shift(1), - "feature_delay_2": X.feature.shift(2), - "feature_delay_3": X.feature.shift(3), - "feature_delay_4": X.feature.shift(4), - "feature_delay_5": X.feature.shift(5), - "target_delay_0": y, - "target_delay_1": y.shift(1), - "target_delay_2": y.shift(2), - "target_delay_3": y.shift(3), - "target_delay_4": y.shift(4), - "target_delay_5": y.shift(5)}) - - pd.testing.assert_frame_equal(DelayedFeatureTransformer(max_delay=5, gap=1).fit_transform(X, y), answer) - - answer_only_y = pd.DataFrame({"target_delay_0": y, - "target_delay_1": y.shift(1), - "target_delay_2": 
y.shift(2), - "target_delay_3": y.shift(3), - "target_delay_4": y.shift(4), - "target_delay_5": y.shift(5)}) - pd.testing.assert_frame_equal(DelayedFeatureTransformer(max_delay=5, gap=1).fit_transform(X=None, y=y), answer_only_y) + expected = pd.DataFrame({"feature": X.feature.astype("Int64"), + "feature_delay_1": X.feature.shift(1), + "feature_delay_2": X.feature.shift(2), + "feature_delay_3": X.feature.shift(3), + "feature_delay_4": X.feature.shift(4), + "feature_delay_5": X.feature.shift(5), + "target_delay_0": y.astype("Int64"), + "target_delay_1": y.shift(1), + "target_delay_2": y.shift(2), + "target_delay_3": y.shift(3), + "target_delay_4": y.shift(4), + "target_delay_5": y.shift(5)}) + + assert_frame_equal(expected, DelayedFeatureTransformer(max_delay=5, gap=1).fit_transform(X, y).to_dataframe()) + + expected_only_y = pd.DataFrame({"target_delay_0": y.astype("Int64"), + "target_delay_1": y.shift(1), + "target_delay_2": y.shift(2), + "target_delay_3": y.shift(3), + "target_delay_4": y.shift(4), + "target_delay_5": y.shift(5)}) + assert_frame_equal(expected_only_y, DelayedFeatureTransformer(max_delay=5, gap=1).fit_transform(X=None, y=y).to_dataframe()) def test_delayed_feature_extractor_maxdelay3_gap7(delayed_features_data): X, y = delayed_features_data - answer = pd.DataFrame({"feature": X.feature, - "feature_delay_1": X.feature.shift(1), - "feature_delay_2": X.feature.shift(2), - "feature_delay_3": X.feature.shift(3), - "target_delay_0": y, - "target_delay_1": y.shift(1), - "target_delay_2": y.shift(2), - "target_delay_3": y.shift(3)}) + expected = pd.DataFrame({"feature": X.feature.astype("Int64"), + "feature_delay_1": X.feature.shift(1), + "feature_delay_2": X.feature.shift(2), + "feature_delay_3": X.feature.shift(3), + "target_delay_0": y.astype("Int64"), + "target_delay_1": y.shift(1), + "target_delay_2": y.shift(2), + "target_delay_3": y.shift(3)}) - pd.testing.assert_frame_equal(DelayedFeatureTransformer(max_delay=3, gap=7).fit_transform(X, y), answer) + assert_frame_equal(expected, DelayedFeatureTransformer(max_delay=3, gap=7).fit_transform(X, y).to_dataframe()) - answer_only_y = pd.DataFrame({"target_delay_0": y, - "target_delay_1": y.shift(1), - "target_delay_2": y.shift(2), - "target_delay_3": y.shift(3)}) - pd.testing.assert_frame_equal(DelayedFeatureTransformer(max_delay=3, gap=7).fit_transform(X=None, y=y), answer_only_y) + expected_only_y = pd.DataFrame({"target_delay_0": y.astype("Int64"), + "target_delay_1": y.shift(1), + "target_delay_2": y.shift(2), + "target_delay_3": y.shift(3)}) + assert_frame_equal(expected_only_y, DelayedFeatureTransformer(max_delay=3, gap=7).fit_transform(X=None, y=y).to_dataframe()) def test_delayed_feature_extractor_numpy(delayed_features_data): @@ -95,33 +96,33 @@ def test_delayed_feature_extractor_numpy(delayed_features_data): X_np = X.values y_np = y.values - answer = pd.DataFrame({0: X.feature, - "0_delay_1": X.feature.shift(1), - "0_delay_2": X.feature.shift(2), - "0_delay_3": X.feature.shift(3), - "target_delay_0": y, - "target_delay_1": y.shift(1), - "target_delay_2": y.shift(2), - "target_delay_3": y.shift(3)}) + expected = pd.DataFrame({0: X.feature.astype("Int64"), + "0_delay_1": X.feature.shift(1), + "0_delay_2": X.feature.shift(2), + "0_delay_3": X.feature.shift(3), + "target_delay_0": y.astype("Int64"), + "target_delay_1": y.shift(1), + "target_delay_2": y.shift(2), + "target_delay_3": y.shift(3)}) - pd.testing.assert_frame_equal(DelayedFeatureTransformer(max_delay=3, gap=7).fit_transform(X_np, y_np), answer) + 
assert_frame_equal(expected, DelayedFeatureTransformer(max_delay=3, gap=7).fit_transform(X_np, y_np).to_dataframe()) - answer_only_y = pd.DataFrame({"target_delay_0": y, - "target_delay_1": y.shift(1), - "target_delay_2": y.shift(2), - "target_delay_3": y.shift(3)}) - pd.testing.assert_frame_equal(DelayedFeatureTransformer(max_delay=3, gap=7).fit_transform(X=None, y=y_np), answer_only_y) + expected_only_y = pd.DataFrame({"target_delay_0": y.astype("Int64"), + "target_delay_1": y.shift(1), + "target_delay_2": y.shift(2), + "target_delay_3": y.shift(3)}) + assert_frame_equal(expected_only_y, DelayedFeatureTransformer(max_delay=3, gap=7).fit_transform(X=None, y=y_np).to_dataframe()) @pytest.mark.parametrize("delay_features,delay_target", [(False, True), (True, False), (False, False)]) def test_lagged_feature_extractor_delay_features_delay_target(delay_features, delay_target, delayed_features_data): X, y = delayed_features_data - all_delays = pd.DataFrame({"feature": X.feature, + all_delays = pd.DataFrame({"feature": X.feature.astype("Int64"), "feature_delay_1": X.feature.shift(1), "feature_delay_2": X.feature.shift(2), "feature_delay_3": X.feature.shift(3), - "target_delay_0": y, + "target_delay_0": y.astype("Int64"), "target_delay_1": y.shift(1), "target_delay_2": y.shift(2), "target_delay_3": y.shift(3)}) @@ -132,44 +133,44 @@ def test_lagged_feature_extractor_delay_features_delay_target(delay_features, de transformer = DelayedFeatureTransformer(max_delay=3, gap=1, delay_features=delay_features, delay_target=delay_target) - pd.testing.assert_frame_equal(transformer.fit_transform(X, y), all_delays) + assert_frame_equal(all_delays, transformer.fit_transform(X, y).to_dataframe()) @pytest.mark.parametrize("delay_features,delay_target", [(False, True), (True, False), (False, False)]) def test_lagged_feature_extractor_delay_target(delay_features, delay_target, delayed_features_data): X, y = delayed_features_data - answer = pd.DataFrame() + expected = pd.DataFrame() if delay_target: - answer = pd.DataFrame({"target_delay_0": y, - "target_delay_1": y.shift(1), - "target_delay_2": y.shift(2), - "target_delay_3": y.shift(3)}) + expected = pd.DataFrame({"target_delay_0": y.astype("Int64"), + "target_delay_1": y.shift(1), + "target_delay_2": y.shift(2), + "target_delay_3": y.shift(3)}) transformer = DelayedFeatureTransformer(max_delay=3, gap=1, delay_features=delay_features, delay_target=delay_target) - pd.testing.assert_frame_equal(transformer.fit_transform(None, y), answer) + assert_frame_equal(transformer.fit_transform(None, y).to_dataframe(), expected) @pytest.mark.parametrize("gap", [0, 1, 7]) def test_target_delay_when_gap_is_0(gap, delayed_features_data): X, y = delayed_features_data - answer = pd.DataFrame({"feature": X.feature, - "feature_delay_1": X.feature.shift(1), - "target_delay_0": y, - "target_delay_1": y.shift(1)}) + expected = pd.DataFrame({"feature": X.feature.astype("Int64"), + "feature_delay_1": X.feature.shift(1), + "target_delay_0": y.astype("Int64"), + "target_delay_1": y.shift(1)}) if gap == 0: - answer = answer.drop(columns=["target_delay_0"]) + expected = expected.drop(columns=["target_delay_0"]) transformer = DelayedFeatureTransformer(max_delay=1, gap=gap) - pd.testing.assert_frame_equal(transformer.fit_transform(X, y), answer) + assert_frame_equal(transformer.fit_transform(X, y).to_dataframe(), expected) - answer = pd.DataFrame({"target_delay_0": y, - "target_delay_1": y.shift(1)}) + expected = pd.DataFrame({"target_delay_0": y.astype("Int64"), + "target_delay_1": 
y.shift(1)}) if gap == 0: - answer = answer.drop(columns=["target_delay_0"]) + expected = expected.drop(columns=["target_delay_0"]) - pd.testing.assert_frame_equal(transformer.fit_transform(None, y), answer) + assert_frame_equal(transformer.fit_transform(None, y).to_dataframe(), expected) diff --git a/evalml/tests/component_tests/test_xgboost_classifier.py b/evalml/tests/component_tests/test_xgboost_classifier.py index 80521263cf..d6d76b1e12 100644 --- a/evalml/tests/component_tests/test_xgboost_classifier.py +++ b/evalml/tests/component_tests/test_xgboost_classifier.py @@ -64,11 +64,11 @@ def test_xgboost_feature_name_with_random_ascii(problem_type, X_y_binary, X_y_mu clf.fit(X, y) predictions = clf.predict(X) assert len(predictions) == len(y) - assert not np.isnan(predictions).all() + assert not np.isnan(predictions.to_series()).all() predictions = clf.predict_proba(X) assert predictions.shape == (len(y), expected_cols) - assert not np.isnan(predictions).all().all() + assert not np.isnan(predictions.to_dataframe()).all().all() assert len(clf.feature_importance) == len(X.columns) assert not np.isnan(clf.feature_importance).all().all() From 094698db577e91fa0364306bbc3c4af0d9d04bc1 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Mon, 11 Jan 2021 21:44:27 -0500 Subject: [PATCH 19/98] fix estimator tests --- .../components/estimators/classifiers/catboost_classifier.py | 1 + evalml/tests/component_tests/test_estimators.py | 5 +++-- 2 files changed, 4 insertions(+), 2 deletions(-) diff --git a/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py b/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py index ab979654a6..ee3d6d8ddd 100644 --- a/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py +++ b/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py @@ -83,6 +83,7 @@ def predict(self, X): predictions = self._label_encoder.inverse_transform(predictions.astype(np.int64)) if not isinstance(predictions, pd.Series): predictions = pd.Series(predictions) + predictions = _convert_to_woodwork_structure(predictions) return predictions @property diff --git a/evalml/tests/component_tests/test_estimators.py b/evalml/tests/component_tests/test_estimators.py index 2f26be8e5f..8ef2e8a360 100644 --- a/evalml/tests/component_tests/test_estimators.py +++ b/evalml/tests/component_tests/test_estimators.py @@ -27,7 +27,8 @@ def test_estimators_feature_name_with_random_ascii(X_y_binary, X_y_multi, X_y_re clf.fit(X, y) assert len(clf.feature_importance) == len(X.columns) assert not np.isnan(clf.feature_importance).all().all() - predictions = clf.predict(X) + print (clf.name) + predictions = clf.predict(X).to_series() assert len(predictions) == len(y) assert not np.isnan(predictions).all() @@ -41,7 +42,7 @@ def test_binary_classification_estimators_predict_proba_col_order(helper_functio if ProblemTypes.BINARY in supported_problem_types: estimator = helper_functions.safe_init_component_with_njobs_1(estimator_class) estimator.fit(X, y) - predicted_proba = estimator.predict_proba(X) + predicted_proba = estimator.predict_proba(X).to_dataframe() expected = np.concatenate([(1 - data).reshape(-1, 1), data.reshape(-1, 1)], axis=1) np.testing.assert_allclose(expected, np.round(predicted_proba).values) From 72a0b9d8a8078027f01a011351181bebb12faaf0 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Mon, 11 Jan 2021 22:49:05 -0500 Subject: [PATCH 20/98] fix some component tests, more to go --- .../transformers/preprocessing/lsa.py | 3 +- 
.../preprocessing/text_featurizer.py | 2 +- .../components/transformers/transformer.py | 1 + evalml/pipelines/components/utils.py | 6 +- .../tests/component_tests/test_components.py | 114 ++---------------- .../tests/component_tests/test_estimators.py | 91 +++++++++++++- 6 files changed, 110 insertions(+), 107 deletions(-) diff --git a/evalml/pipelines/components/transformers/preprocessing/lsa.py b/evalml/pipelines/components/transformers/preprocessing/lsa.py index ce1eb658c4..fcaa1e2f29 100644 --- a/evalml/pipelines/components/transformers/preprocessing/lsa.py +++ b/evalml/pipelines/components/transformers/preprocessing/lsa.py @@ -53,9 +53,10 @@ def transform(self, X, y=None): format `LSA(original_column_name)[feature_number]`, where `feature_number` is 0 or 1. """ X = _convert_to_woodwork_structure(X) - X = _convert_woodwork_types_wrapper(X.to_dataframe()) if len(self._all_text_columns) == 0: return X + + X = _convert_woodwork_types_wrapper(X.to_dataframe()) X_t = X.copy() text_columns = self._get_text_columns(X) for col in text_columns: diff --git a/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py b/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py index a3fd15e5e3..24cc63c8ec 100644 --- a/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py +++ b/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py @@ -97,10 +97,10 @@ def transform(self, X, y=None): ww.DataTable: Transformed X """ X = _convert_to_woodwork_structure(X) - X = _convert_woodwork_types_wrapper(X.to_dataframe()) if self._features is None or len(self._features) == 0: return X + X = _convert_woodwork_types_wrapper(X.to_dataframe()) text_columns = self._get_text_columns(X) es = self._make_entity_set(X, text_columns) X_nlp_primitives = ft.calculate_feature_matrix(features=self._features, entityset=es) diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index 5df6531aa4..f9f421bd4b 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -4,6 +4,7 @@ from evalml.utils.gen_utils import ( _convert_to_woodwork_structure, _convert_woodwork_types_wrapper +) class Transformer(ComponentBase): diff --git a/evalml/pipelines/components/utils.py b/evalml/pipelines/components/utils.py index 8e23b0078a..f50e990e0a 100644 --- a/evalml/pipelines/components/utils.py +++ b/evalml/pipelines/components/utils.py @@ -147,7 +147,7 @@ def predict(self, X): pd.Series: Predicted values """ check_is_fitted(self, 'is_fitted_') - return self.pipeline.predict(X).to_numpy() + return self.pipeline.predict(X).to_dataframe().to_numpy() def predict_proba(self, X): """Make probability estimates for labels. 
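
These wrapper changes all follow the same unwrap-to-numpy shape: scikit-learn's estimator API expects plain numpy arrays, so the Woodwork structures an evalml pipeline now returns must be converted back before leaving the wrapper. A minimal sketch of the round-trip, assuming the DataTable API used throughout this series and hypothetical class-probability values:

    import pandas as pd
    import woodwork as ww

    # stand-in for what an evalml pipeline's predict_proba now returns
    proba = ww.DataTable(pd.DataFrame({"class_0": [0.8, 0.3], "class_1": [0.2, 0.7]}))
    # unwrap to pandas, then to numpy for scikit-learn consumers
    arr = proba.to_dataframe().to_numpy()
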
@@ -158,7 +158,7 @@ def predict_proba(self, X): Returns: pd.DataFrame: Probability estimates """ - return self.pipeline.predict_proba(X).to_numpy() + return self.pipeline.predict_proba(X).to_dataframe().to_numpy() class WrappedSKRegressor(BaseEstimator, RegressorMixin): @@ -195,7 +195,7 @@ def predict(self, X): Returns: pd.Series: Predicted values """ - return self.pipeline.predict(X).to_numpy() + return self.pipeline.predict(X).to_dataframe().to_numpy() def scikit_learn_wrapped_estimator(evalml_obj): diff --git a/evalml/tests/component_tests/test_components.py b/evalml/tests/component_tests/test_components.py index 10cc96203f..95b297bac1 100644 --- a/evalml/tests/component_tests/test_components.py +++ b/evalml/tests/component_tests/test_components.py @@ -8,6 +8,7 @@ import numpy as np import pandas as pd import pytest +import woodwork as ww from skopt.space import Categorical from evalml.exceptions import ( @@ -61,7 +62,6 @@ ) from evalml.pipelines.components.utils import ( _all_estimators, - _all_estimators_used_in_search, _all_transformers, all_components, generate_component_code @@ -535,85 +535,44 @@ def test_transformer_transform_output_type(X_y_binary): component.fit(X, y=y) transform_output = component.transform(X, y=y) - assert isinstance(transform_output, pd.DataFrame) + assert isinstance(transform_output, ww.DataTable) if isinstance(component, SelectColumns): assert transform_output.shape == (X.shape[0], 0) - assert isinstance(transform_output.columns, pd.Index) + assert isinstance(transform_output.to_dataframe().columns, pd.Index) elif isinstance(component, PCA) or isinstance(component, LinearDiscriminantAnalysis): assert transform_output.shape[0] == X.shape[0] assert transform_output.shape[1] <= X.shape[1] - assert isinstance(transform_output.columns, pd.Index) + assert isinstance(transform_output.to_dataframe().columns, pd.Index) elif isinstance(component, DFSTransformer): assert transform_output.shape[0] == X.shape[0] assert transform_output.shape[1] >= X.shape[1] - assert isinstance(transform_output.columns, pd.Index) + assert isinstance(transform_output.to_dataframe().columns, pd.Index) elif isinstance(component, DelayedFeatureTransformer): # We just want to check that DelayedFeaturesTransformer outputs a DataFrame # The dataframe shape and index are checked in test_delayed_features_transformer.py continue else: assert transform_output.shape == X.shape - assert (transform_output.columns == X_cols_expected).all() + assert (transform_output.to_dataframe().columns == X_cols_expected).all() transform_output = component.fit_transform(X, y=y) - assert isinstance(transform_output, pd.DataFrame) + assert isinstance(transform_output, ww.DataTable) if isinstance(component, SelectColumns): assert transform_output.shape == (X.shape[0], 0) - assert isinstance(transform_output.columns, pd.Index) + assert isinstance(transform_output.to_dataframe().columns, pd.Index) elif isinstance(component, PCA) or isinstance(component, LinearDiscriminantAnalysis): assert transform_output.shape[0] == X.shape[0] assert transform_output.shape[1] <= X.shape[1] - assert isinstance(transform_output.columns, pd.Index) + assert isinstance(transform_output.to_dataframe().columns, pd.Index) elif isinstance(component, DFSTransformer): assert transform_output.shape[0] == X.shape[0] assert transform_output.shape[1] >= X.shape[1] - assert isinstance(transform_output.columns, pd.Index) + assert isinstance(transform_output.to_dataframe().columns, pd.Index) else: assert transform_output.shape == X.shape - assert 
(transform_output.columns == X_cols_expected).all() - - -def test_estimator_predict_output_type(X_y_binary, helper_functions): - X_np, y_np = X_y_binary - assert isinstance(X_np, np.ndarray) - assert isinstance(y_np, np.ndarray) - y_list = list(y_np) - X_df_no_col_names = pd.DataFrame(X_np) - range_index = pd.RangeIndex(start=0, stop=X_np.shape[1], step=1) - X_df_with_col_names = pd.DataFrame(X_np, columns=['x' + str(i) for i in range(X_np.shape[1])]) - y_series_no_name = pd.Series(y_np) - y_series_with_name = pd.Series(y_np, name='target') - datatype_combos = [(X_np, y_np, range_index, np.unique(y_np)), - (X_np, y_list, range_index, np.unique(y_np)), - (X_df_no_col_names, y_series_no_name, range_index, y_series_no_name.unique()), - (X_df_with_col_names, y_series_with_name, X_df_with_col_names.columns, y_series_with_name.unique())] - - for component_class in _all_estimators_used_in_search(): - for X, y, X_cols_expected, y_cols_expected in datatype_combos: - print('Checking output of predict for estimator "{}" on X type {} cols {}, y type {} name {}' - .format(component_class.name, type(X), - X.columns if isinstance(X, pd.DataFrame) else None, type(y), - y.name if isinstance(y, pd.Series) else None)) - component = helper_functions.safe_init_component_with_njobs_1(component_class) - component.fit(X, y=y) - predict_output = component.predict(X) - assert isinstance(predict_output, pd.Series) - assert len(predict_output) == len(y) - assert predict_output.name is None - - if not ((ProblemTypes.BINARY in component_class.supported_problem_types) or - (ProblemTypes.MULTICLASS in component_class.supported_problem_types)): - continue - print('Checking output of predict_proba for estimator "{}" on X type {} cols {}, y type {} name {}' - .format(component_class.name, type(X), - X.columns if isinstance(X, pd.DataFrame) else None, type(y), - y.name if isinstance(y, pd.Series) else None)) - predict_proba_output = component.predict_proba(X) - assert isinstance(predict_proba_output, pd.DataFrame) - assert predict_proba_output.shape == (len(y), len(np.unique(y))) - assert (predict_proba_output.columns == y_cols_expected).all() + assert (transform_output.to_dataframe().columns == X_cols_expected).all() @pytest.mark.parametrize("cls", [cls for cls in all_components() if cls not in [StackedEnsembleRegressor, StackedEnsembleClassifier]]) @@ -638,10 +597,10 @@ def fit(self, X, y): pass def predict(self, X): - pass + return pd.Series() def predict_proba(self, X): - pass + return pd.DataFrame() class MockEstimator(Estimator): name = "Mock Estimator" @@ -664,53 +623,6 @@ def __init__(self, parameters=None, component_obj=None, random_state=0): est.predict_proba(X) -def test_estimator_check_for_fit_with_overrides(X_y_binary): - class MockEstimatorWithOverrides(Estimator): - name = "Mock Estimator" - model_family = ModelFamily.LINEAR_MODEL - supported_problem_types = ['binary'] - - def fit(self, X, y): - pass - - def predict(self, X): - pass - - def predict_proba(self, X): - pass - - class MockEstimatorWithOverridesSubclass(Estimator): - name = "Mock Estimator Subclass" - model_family = ModelFamily.LINEAR_MODEL - supported_problem_types = ['binary'] - - def fit(self, X, y): - pass - - def predict(self, X): - pass - - def predict_proba(self, X): - pass - - X, y = X_y_binary - est = MockEstimatorWithOverrides() - est_subclass = MockEstimatorWithOverridesSubclass() - - with pytest.raises(ComponentNotYetFittedError, match='You must fit'): - est.predict(X) - with pytest.raises(ComponentNotYetFittedError, match='You must 
fit'): - est_subclass.predict(X) - - est.fit(X, y) - est.predict(X) - est.predict_proba(X) - - est_subclass.fit(X, y) - est_subclass.predict(X) - est_subclass.predict_proba(X) - - def test_transformer_check_for_fit(X_y_binary): class MockTransformerObj(): def __init__(self): diff --git a/evalml/tests/component_tests/test_estimators.py b/evalml/tests/component_tests/test_estimators.py index e98c690175..339414a621 100644 --- a/evalml/tests/component_tests/test_estimators.py +++ b/evalml/tests/component_tests/test_estimators.py @@ -3,7 +3,9 @@ import numpy as np import pandas as pd import pytest +import woodwork as ww +from evalml.exceptions import ComponentNotYetFittedError from evalml.model_family import ModelFamily from evalml.pipelines.components import Estimator from evalml.pipelines.components.utils import ( @@ -31,7 +33,6 @@ def test_estimators_feature_name_with_random_ascii(X_y_binary, X_y_multi, X_y_re clf.fit(X, y) assert len(clf.feature_importance) == len(X.columns) assert not np.isnan(clf.feature_importance).all().all() - print (clf.name) predictions = clf.predict(X).to_series() assert len(predictions) == len(y) assert not np.isnan(predictions).all() @@ -86,3 +87,91 @@ def test_all_estimators_check_fit_input_type_regression(data_type, X_y_regressio component = helper_functions.safe_init_component_with_njobs_1(component_class) component.fit(X, y) component.predict(X) + + +def test_estimator_predict_output_type(X_y_binary, helper_functions): + X_np, y_np = X_y_binary + assert isinstance(X_np, np.ndarray) + assert isinstance(y_np, np.ndarray) + y_list = list(y_np) + X_df_no_col_names = pd.DataFrame(X_np) + range_index = pd.RangeIndex(start=0, stop=X_np.shape[1], step=1) + X_df_with_col_names = pd.DataFrame(X_np, columns=['x' + str(i) for i in range(X_np.shape[1])]) + y_series_no_name = pd.Series(y_np) + y_series_with_name = pd.Series(y_np, name='target') + datatype_combos = [(X_np, y_np, range_index, np.unique(y_np)), + (X_np, y_list, range_index, np.unique(y_np)), + (X_df_no_col_names, y_series_no_name, range_index, y_series_no_name.unique()), + (X_df_with_col_names, y_series_with_name, X_df_with_col_names.columns, y_series_with_name.unique())] + + for component_class in _all_estimators_used_in_search(): + for X, y, X_cols_expected, y_cols_expected in datatype_combos: + print('Checking output of predict for estimator "{}" on X type {} cols {}, y type {} name {}' + .format(component_class.name, type(X), + X.columns if isinstance(X, pd.DataFrame) else None, type(y), + y.name if isinstance(y, pd.Series) else None)) + component = helper_functions.safe_init_component_with_njobs_1(component_class) + component.fit(X, y=y) + predict_output = component.predict(X) + assert isinstance(predict_output, ww.DataColumn) + assert len(predict_output) == len(y) + assert predict_output.name is None + + if not ((ProblemTypes.BINARY in component_class.supported_problem_types) or + (ProblemTypes.MULTICLASS in component_class.supported_problem_types)): + continue + print('Checking output of predict_proba for estimator "{}" on X type {} cols {}, y type {} name {}' + .format(component_class.name, type(X), + X.columns if isinstance(X, pd.DataFrame) else None, type(y), + y.name if isinstance(y, pd.Series) else None)) + predict_proba_output = component.predict_proba(X) + assert isinstance(predict_proba_output, ww.DataTable) + assert predict_proba_output.shape == (len(y), len(np.unique(y))) + assert (list(predict_proba_output.columns) == y_cols_expected).all() + + +def 
test_estimator_check_for_fit_with_overrides(X_y_binary): + class MockEstimatorWithOverrides(Estimator): + name = "Mock Estimator" + model_family = ModelFamily.LINEAR_MODEL + supported_problem_types = ['binary'] + + def fit(self, X, y): + pass + + def predict(self, X): + pass + + def predict_proba(self, X): + pass + + class MockEstimatorWithOverridesSubclass(Estimator): + name = "Mock Estimator Subclass" + model_family = ModelFamily.LINEAR_MODEL + supported_problem_types = ['binary'] + + def fit(self, X, y): + pass + + def predict(self, X): + pass + + def predict_proba(self, X): + pass + + X, y = X_y_binary + est = MockEstimatorWithOverrides() + est_subclass = MockEstimatorWithOverridesSubclass() + + with pytest.raises(ComponentNotYetFittedError, match='You must fit'): + est.predict(X) + with pytest.raises(ComponentNotYetFittedError, match='You must fit'): + est_subclass.predict(X) + + est.fit(X, y) + est.predict(X) + est.predict_proba(X) + + est_subclass.fit(X, y) + est_subclass.predict(X) + est_subclass.predict_proba(X) From 86f4dbcbfe353748f6ff102019c1e04e3566016b Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Mon, 11 Jan 2021 23:14:46 -0500 Subject: [PATCH 21/98] continue fixing tests, more to go --- evalml/pipelines/classification_pipeline.py | 10 ++++++---- evalml/pipelines/components/utils.py | 4 ++-- evalml/pipelines/pipeline_base.py | 6 ++++-- 3 files changed, 12 insertions(+), 8 deletions(-) diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index a74e295b9e..9fd4811fba 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -91,7 +91,8 @@ def predict(self, X, objective=None): pd.Series : Estimated labels """ predictions = self._predict(X, objective) - return pd.Series(self._decode_targets(predictions), name=self.input_target_name) + predictions = pd.Series(self._decode_targets(predictions), name=self.input_target_name) + return _convert_to_woodwork_structure(predictions) def predict_proba(self, X): """Make probability estimates for labels. @@ -103,9 +104,9 @@ def predict_proba(self, X): pd.DataFrame: Probability estimates """ X = self.compute_estimator_features(X, y=None) - proba = self.estimator.predict_proba(X) + proba = self.estimator.predict_proba(X).to_dataframe() proba.columns = self._encoder.classes_ - return proba + return _convert_to_woodwork_structure(proba) def score(self, X, y, objectives): """Evaluate model performance on objectives @@ -123,7 +124,8 @@ def score(self, X, y, objectives): objectives = [get_objective(o, return_instance=True) for o in objectives] y = self._encode_targets(y) y_predicted, y_predicted_proba = self._compute_predictions(X, objectives) - + y_predicted = _convert_to_woodwork_structure(y_predicted) + y_predicted_proba = _convert_to_woodwork_structure(y_predicted_proba) return self._score_all_objectives(X, y, y_predicted, y_predicted_proba, objectives) def _compute_predictions(self, X, objectives): diff --git a/evalml/pipelines/components/utils.py b/evalml/pipelines/components/utils.py index f50e990e0a..f91d6a12a0 100644 --- a/evalml/pipelines/components/utils.py +++ b/evalml/pipelines/components/utils.py @@ -147,7 +147,7 @@ def predict(self, X): pd.Series: Predicted values """ check_is_fitted(self, 'is_fitted_') - return self.pipeline.predict(X).to_dataframe().to_numpy() + return self.pipeline.predict(X).to_series().to_numpy() def predict_proba(self, X): """Make probability estimates for labels. 
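
For context on the _decode_targets call above: classification pipelines fit a label encoder on the original targets, so the integer predictions coming back from the estimator can be mapped to the original labels before being wrapped into a Woodwork structure again. A sketch of that decode step with scikit-learn's LabelEncoder (which the CatBoost changes earlier in this series also rely on), using hypothetical label values:

    import pandas as pd
    from sklearn.preprocessing import LabelEncoder

    encoder = LabelEncoder().fit(pd.Series(["cat", "dog", "cat", "dog"]))
    # integer class ids back to the original labels: ['cat', 'dog', 'cat']
    decoded = encoder.inverse_transform([0, 1, 0])
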
@@ -195,7 +195,7 @@ def predict(self, X): Returns: pd.Series: Predicted values """ - return self.pipeline.predict(X).to_dataframe().to_numpy() + return self.pipeline.predict(X).to_series().to_numpy() def scikit_learn_wrapped_estimator(evalml_obj): diff --git a/evalml/pipelines/pipeline_base.py b/evalml/pipelines/pipeline_base.py index 1d820a478d..6dd7b9436a 100644 --- a/evalml/pipelines/pipeline_base.py +++ b/evalml/pipelines/pipeline_base.py @@ -222,11 +222,13 @@ def predict(self, X, objective=None): objective (Object or string): The objective to use to make predictions Returns: - pd.Series: Predicted values. + ww.DataColumn: Predicted values. """ X = _convert_to_woodwork_structure(X) predictions = self._component_graph.predict(X) - return predictions.rename(self.input_target_name) + predictions_series = predictions.to_series() + predictions_series.name = self.input_target_name + return _convert_to_woodwork_structure(predictions_series) @abstractmethod def score(self, X, y, objectives): From 350aa6960e18e3e8c7c673de1e0dd48e39b68fef Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Tue, 12 Jan 2021 13:29:04 -0500 Subject: [PATCH 22/98] fix one more test --- evalml/tests/component_tests/test_components.py | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/evalml/tests/component_tests/test_components.py b/evalml/tests/component_tests/test_components.py index 95b297bac1..7487a51436 100644 --- a/evalml/tests/component_tests/test_components.py +++ b/evalml/tests/component_tests/test_components.py @@ -313,7 +313,7 @@ class MockTransformerWithFitTransform(Transformer): hyperparameter_ranges = {} def fit_transform(self, X, y=None): - return X + return ww.DataTable(X) def __init__(self): parameters = {} @@ -342,7 +342,7 @@ def fit(self, X, y=None): return self def transform(self, X, y=None): - return X + return ww.DataTable(X) def __init__(self): parameters = {} @@ -369,14 +369,14 @@ def __init__(self): y = pd.Series(y) component = MockTransformerWithFitTransform() - assert isinstance(component.fit_transform(X, y), pd.DataFrame) + assert isinstance(component.fit_transform(X, y), ww.DataTable) component = MockTransformerWithFitTransformButError() with pytest.raises(RuntimeError): component.fit_transform(X, y) component = MockTransformerWithFitAndTransform() - assert isinstance(component.fit_transform(X, y), pd.DataFrame) + assert isinstance(component.fit_transform(X, y), ww.DataTable) component = MockTransformerWithOnlyFit() with pytest.raises(MethodPropertyNotFoundError): @@ -554,7 +554,7 @@ def test_transformer_transform_output_type(X_y_binary): continue else: assert transform_output.shape == X.shape - assert (transform_output.to_dataframe().columns == X_cols_expected).all() + assert (list(transform_output.columns) == X_cols_expected).all() transform_output = component.fit_transform(X, y=y) assert isinstance(transform_output, ww.DataTable) @@ -632,7 +632,7 @@ def fit(self, X, y): pass def transform(self, X): - pass + return pd.DataFrame() class MockTransformer(Transformer): name = "Mock Transformer" From fc45967bf6dde88003d3c22df417946a3e609840 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Tue, 12 Jan 2021 14:16:01 -0500 Subject: [PATCH 23/98] fix component tests --- .../transformers/encoders/target_encoder.py | 8 ++-- .../feature_selection/feature_selector.py | 42 +++++++++---------- .../transformers/scalers/standard_scaler.py | 18 ++++++++ .../components/transformers/transformer.py | 15 +++++-- .../tests/component_tests/test_components.py | 6 +-- 5 files changed, 57 
insertions(+), 32 deletions(-) diff --git a/evalml/pipelines/components/transformers/encoders/target_encoder.py b/evalml/pipelines/components/transformers/encoders/target_encoder.py index 2156a512b6..ea97d2d5a0 100644 --- a/evalml/pipelines/components/transformers/encoders/target_encoder.py +++ b/evalml/pipelines/components/transformers/encoders/target_encoder.py @@ -58,11 +58,7 @@ def fit(self, X, y): y.reset_index(drop=True, inplace=True) return super().fit(X, y) - def transform(self, X, y=None): - return super().transform(X, y) - def fit_transform(self, X, y): - return self.fit(X, y).transform(X) def get_feature_names(self): """Return feature names for the input features after fitting. diff --git a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py index 67ddcb717e..748ead4040 100644 --- a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py +++ b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py @@ -1,6 +1,10 @@ import pandas as pd from evalml.pipelines.components.transformers import Transformer +from evalml.utils.gen_utils import ( + _convert_to_woodwork_structure, + _convert_woodwork_types_wrapper +) class FeatureSelector(Transformer): @@ -25,22 +29,19 @@ def transform(self, X, y=None): Returns: pd.DataFrame: Transformed X """ - if isinstance(X, pd.DataFrame): - self.input_feature_names = list(X.columns.values) - else: - self.input_feature_names = range(X.shape[1]) + X = _convert_to_woodwork_structure(X) + X = _convert_woodwork_types_wrapper(X.to_dataframe()) + self.input_feature_names = list(X.columns.values) try: X_t = self._component_obj.transform(X) except AttributeError: raise RuntimeError("Transformer requires a transform method or a component_obj that implements transform") - if not isinstance(X_t, pd.DataFrame) and isinstance(X, pd.DataFrame): - X_dtypes = X.dtypes.to_dict() - selected_col_names = self.get_names() - col_types = {key: X_dtypes[key] for key in selected_col_names} - return pd.DataFrame(X_t, columns=selected_col_names, index=X.index).astype(col_types) - else: - return pd.DataFrame(X_t) + X_dtypes = X.dtypes.to_dict() + selected_col_names = self.get_names() + col_types = {key: X_dtypes[key] for key in selected_col_names} + features = pd.DataFrame(X_t, columns=selected_col_names, index=X.index).astype(col_types) + return _convert_to_woodwork_structure(features) def fit_transform(self, X, y=None): """Fits feature selector on data X then transforms X by selecting features @@ -52,19 +53,16 @@ def fit_transform(self, X, y=None): Returns: pd.DataFrame: Transformed X """ - if isinstance(X, pd.DataFrame): - self.input_feature_names = list(X.columns.values) - else: - self.input_feature_names = range(X.shape[1]) + X = _convert_to_woodwork_structure(X) + X = _convert_woodwork_types_wrapper(X.to_dataframe()) + self.input_feature_names = list(X.columns.values) try: X_t = self._component_obj.fit_transform(X, y) except AttributeError: raise RuntimeError("Transformer requires a fit_transform method or a component_obj that implements fit_transform") - if not isinstance(X_t, pd.DataFrame) and isinstance(X, pd.DataFrame): - X_dtypes = X.dtypes.to_dict() - selected_col_names = self.get_names() - col_types = {key: X_dtypes[key] for key in selected_col_names} - return
pd.DataFrame(X_t, columns=selected_col_names, index=X.index).astype(col_types) - else: - return pd.DataFrame(X_t) + X_dtypes = X.dtypes.to_dict() + selected_col_names = self.get_names() + col_types = {key: X_dtypes[key] for key in selected_col_names} + features = pd.DataFrame(X_t, columns=selected_col_names, index=X.index).astype(col_types) + return _convert_to_woodwork_structure(features) diff --git a/evalml/pipelines/components/transformers/scalers/standard_scaler.py b/evalml/pipelines/components/transformers/scalers/standard_scaler.py index 9189dd6c01..38d70c4bcc 100644 --- a/evalml/pipelines/components/transformers/scalers/standard_scaler.py +++ b/evalml/pipelines/components/transformers/scalers/standard_scaler.py @@ -1,6 +1,11 @@ +import pandas as pd from sklearn.preprocessing import StandardScaler as SkScaler from evalml.pipelines.components.transformers import Transformer +from evalml.utils.gen_utils import ( + _convert_to_woodwork_structure, + _convert_woodwork_types_wrapper +) class StandardScaler(Transformer): @@ -16,3 +21,16 @@ def __init__(self, random_state=0, **kwargs): super().__init__(parameters=parameters, component_obj=scaler, random_state=random_state) + + def transform(self, X, y=None): + + X = _convert_to_woodwork_structure(X) + X = _convert_woodwork_types_wrapper(X.to_dataframe()) + X_cols = X.columns + X_index = X.index + X_t = self._component_obj.transform(X) + X_t_df = pd.DataFrame(X_t, columns=X_cols, index=X_index) + return _convert_to_woodwork_structure(X_t_df) + + def fit_transform(self, X, y=None): + return self.fit(X, y).transform(X, y) diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index f9f421bd4b..18baff27be 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -1,3 +1,5 @@ +import pandas as pd + from evalml.exceptions import MethodPropertyNotFoundError from evalml.model_family import ModelFamily from evalml.pipelines.components import ComponentBase @@ -33,13 +35,20 @@ def transform(self, X, y=None): ww.DataTable: Transformed X """ try: - X_t = self._component_obj.transform(X) + X = _convert_to_woodwork_structure(X) + X = _convert_woodwork_types_wrapper(X.to_dataframe()) + if y is not None: + y = _convert_to_woodwork_structure(y) + y = _convert_woodwork_types_wrapper(y.to_series()) + X_cols = X.columns + X_index = X.index + X_t = self._component_obj.transform(X, y) except AttributeError: raise MethodPropertyNotFoundError("Transformer requires a transform method or a component_obj that implements transform") # if isinstance(X, pd.DataFrame): # return _convert_to_woodwork_structure(pd.DataFrame(X_t, columns=X.columns, index=X.index)) - - return _convert_to_woodwork_structure(X_t) + X_t_df = pd.DataFrame(X_t, columns=X_cols, index=X_index) + return _convert_to_woodwork_structure(X_t_df) def fit_transform(self, X, y=None): """Fits on X and transforms X diff --git a/evalml/tests/component_tests/test_components.py b/evalml/tests/component_tests/test_components.py index 7487a51436..817489e58a 100644 --- a/evalml/tests/component_tests/test_components.py +++ b/evalml/tests/component_tests/test_components.py @@ -554,7 +554,7 @@ def test_transformer_transform_output_type(X_y_binary): continue else: assert transform_output.shape == X.shape - assert (list(transform_output.columns) == X_cols_expected).all() + assert (list(transform_output.columns) == list(X_cols_expected)) transform_output = 
component.fit_transform(X, y=y) assert isinstance(transform_output, ww.DataTable) @@ -572,7 +572,7 @@ def test_transformer_transform_output_type(X_y_binary): assert isinstance(transform_output.to_dataframe().columns, pd.Index) else: assert transform_output.shape == X.shape - assert (transform_output.to_dataframe().columns == X_cols_expected).all() + assert (list(transform_output.columns) == list(X_cols_expected)) @pytest.mark.parametrize("cls", [cls for cls in all_components() if cls not in [StackedEnsembleRegressor, StackedEnsembleClassifier]]) @@ -631,7 +631,7 @@ def __init__(self): def fit(self, X, y): pass - def transform(self, X): + def transform(self, X, y=None): return pd.DataFrame() class MockTransformer(Transformer): From d619154cb5a82385a567e3e249076dbe1b4aee89 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Tue, 12 Jan 2021 17:44:23 -0500 Subject: [PATCH 24/98] fix more pipeline tests --- evalml/pipelines/classification_pipeline.py | 10 ++++-- evalml/pipelines/component_graph.py | 32 ++++++++++++++++--- evalml/pipelines/components/utils.py | 10 ++++-- .../time_series_classification_pipelines.py | 25 +++++++++++++-- .../time_series_regression_pipeline.py | 11 ++++++- .../test_cost_benefit_matrix.py | 2 +- .../pipeline_tests/test_component_graph.py | 7 ++-- evalml/tests/pipeline_tests/test_pipelines.py | 30 +++++++++-------- evalml/utils/gen_utils.py | 4 +-- 9 files changed, 98 insertions(+), 33 deletions(-) diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index 9fd4811fba..3ce7631ddf 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -91,6 +91,7 @@ def predict(self, X, objective=None): pd.Series : Estimated labels """ predictions = self._predict(X, objective) + predictions = predictions.to_series() predictions = pd.Series(self._decode_targets(predictions), name=self.input_target_name) return _convert_to_woodwork_structure(predictions) @@ -124,8 +125,13 @@ def score(self, X, y, objectives): objectives = [get_objective(o, return_instance=True) for o in objectives] y = self._encode_targets(y) y_predicted, y_predicted_proba = self._compute_predictions(X, objectives) - y_predicted = _convert_to_woodwork_structure(y_predicted) - y_predicted_proba = _convert_to_woodwork_structure(y_predicted_proba) + if y_predicted is not None: + y_predicted = _convert_to_woodwork_structure(y_predicted) + y_predicted = _convert_woodwork_types_wrapper(y_predicted.to_series()) + + if y_predicted_proba is not None: + y_predicted_proba = _convert_to_woodwork_structure(y_predicted_proba) + y_predicted_proba = _convert_woodwork_types_wrapper(y_predicted_proba.to_dataframe()) return self._score_all_objectives(X, y, y_predicted, y_predicted_proba, objectives) def _compute_predictions(self, X, objectives): diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 74fc488f5c..3ffed33f82 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -6,7 +6,11 @@ from evalml.pipelines.components import ComponentBase, Estimator, Transformer from evalml.pipelines.components.utils import handle_component_class -from evalml.utils import get_random_state, import_or_raise +from evalml.utils import ( + _convert_to_woodwork_structure, + get_random_state, + import_or_raise +) class ComponentGraph: @@ -104,9 +108,16 @@ def fit_features(self, X, y): for parent in self.get_parents(self.compute_order[-1]): parent_output = component_outputs.get(parent, 
component_outputs.get(f'{parent}.x')) if isinstance(parent_output, pd.Series): + # this shouldn't happen anymore; parents now return ww.DataColumn parent_output = pd.DataFrame(parent_output, columns=[parent]) + if isinstance(parent_output, ww.DataColumn): + parent_output = parent_output.to_series() + parent_output = pd.DataFrame(parent_output, columns=[parent]) + parent_output = _convert_to_woodwork_structure(parent_output) final_component_inputs.append(parent_output) - return pd.concat(final_component_inputs, axis=1) + + concatted = pd.concat([component_input.to_dataframe() for component_input in final_component_inputs], axis=1) + return _convert_to_woodwork_structure(concatted) def predict(self, X): """Make predictions using selected features. @@ -124,6 +135,7 @@ def predict(self, X): return outputs.get(final_component, outputs.get(f'{final_component}.x')) def compute_final_component_features(self, X, y=None): + ### TODO: COMBINE WITH fit_features """ Transforms all components save the final one, and gathers the data from any number of parents to get all the information that should be fed to the final component @@ -141,9 +153,17 @@ def compute_final_component_features(self, X, y=None): for parent in self.get_parents(self.compute_order[-1]): parent_output = component_outputs.get(parent, component_outputs.get(f'{parent}.x')) if isinstance(parent_output, pd.Series): + # shouldn't happen anymore... parent_output = pd.DataFrame(parent_output, columns=[parent]) + if isinstance(parent_output, ww.DataColumn): + parent_output = parent_output.to_series() + parent_output = pd.DataFrame(parent_output, columns=[parent]) + parent_output = _convert_to_woodwork_structure(parent_output) final_component_inputs.append(parent_output) - return pd.concat(final_component_inputs, axis=1) + concatted = pd.concat([i.to_dataframe() if isinstance(i, ww.DataTable) else i for i in final_component_inputs], axis=1) + + return _convert_to_woodwork_structure(concatted) def _compute_features(self, component_list, X, y=None, fit=False): """Transforms the data by applying the given components.
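The two hunks above repeat one pattern: a parent that is an estimator now hands back a ww.DataColumn, which gets widened into a one-column frame named after that parent before all of the final component's inputs are concatenated and re-wrapped. A minimal sketch of that pattern, outside the patch; the helper name widen_parent_output is illustrative, not an evalml function:

import pandas as pd
import woodwork as ww

def widen_parent_output(parent_name, parent_output):
    # An estimator parent yields a single column of predictions; name it
    # after the parent so it stays identifiable after the concat.
    if isinstance(parent_output, ww.DataColumn):
        parent_output = parent_output.to_series().rename(parent_name).to_frame()
    if isinstance(parent_output, pd.DataFrame):
        parent_output = ww.DataTable(parent_output)
    return parent_output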
@@ -181,6 +201,10 @@ def _compute_features(self, component_list, X, y=None, fit=False): parent_x = output_cache.get(parent_input, output_cache.get(f'{parent_input}.x')) if isinstance(parent_x, pd.Series): parent_x = pd.DataFrame(parent_x, columns=[parent_input]) + if isinstance(parent_x, ww.DataColumn): + parent_x_series = parent_x.to_series() + parent_x = pd.DataFrame(parent_x_series, columns=[parent_input]) + parent_x = _convert_to_woodwork_structure(parent_x) x_inputs.append(parent_x) input_x, input_y = self._consolidate_inputs(x_inputs, y_input, X, y) self.input_feature_names.update({component_name: list(input_x.columns)}) @@ -223,7 +247,7 @@ def _consolidate_inputs(x_inputs, y_input, X, y): if len(x_inputs) == 0: return_x = X else: - return_x = pd.concat(x_inputs, axis=1) + return_x = pd.concat([x_in.to_dataframe() if isinstance(x_in, ww.DataTable) else x_in for x_in in x_inputs], axis=1) return_y = y if y_input is not None: return_y = y_input diff --git a/evalml/pipelines/components/utils.py b/evalml/pipelines/components/utils.py index f91d6a12a0..b9bf06891c 100644 --- a/evalml/pipelines/components/utils.py +++ b/evalml/pipelines/components/utils.py @@ -9,7 +9,10 @@ from evalml.pipelines.components import ComponentBase, Estimator, Transformer from evalml.problem_types import ProblemTypes, handle_problem_types from evalml.utils import get_logger -from evalml.utils.gen_utils import get_importable_subclasses +from evalml.utils.gen_utils import ( + _convert_woodwork_types_wrapper, + get_importable_subclasses +) logger = get_logger(__file__) @@ -147,7 +150,8 @@ def predict(self, X): pd.Series: Predicted values """ check_is_fitted(self, 'is_fitted_') - return self.pipeline.predict(X).to_series().to_numpy() + + return _convert_woodwork_types_wrapper(self.pipeline.predict(X).to_series()).to_numpy() def predict_proba(self, X): """Make probability estimates for labels. 
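The WrappedSKClassifier change above is the flip side of the conversion story: anything handed to scikit-learn itself has to be plain numpy, and _convert_woodwork_types_wrapper additionally downcasts the nullable dtypes woodwork introduces. A rough sketch of the unwrap step, using only behavior visible in these diffs; unwrap_for_sklearn is an illustrative name, not an evalml function:

import numpy as np
import woodwork as ww

def unwrap_for_sklearn(predictions):
    # Pipelines now return ww.DataColumn; the sklearn wrappers need numpy,
    # so go DataColumn -> pandas -> numpy before crossing the boundary.
    if isinstance(predictions, ww.DataColumn):
        predictions = predictions.to_series()
    return np.asarray(predictions)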
@@ -158,7 +162,7 @@ def predict_proba(self, X): Returns: pd.DataFrame: Probability estimates """ - return self.pipeline.predict_proba(X).to_dataframe().to_numpy() + return _convert_woodwork_types_wrapper(self.pipeline.predict_proba(X).to_dataframe()).to_numpy() class WrappedSKRegressor(BaseEstimator, RegressorMixin): diff --git a/evalml/pipelines/time_series_classification_pipelines.py b/evalml/pipelines/time_series_classification_pipelines.py index 2f035c3db2..759d6df684 100644 --- a/evalml/pipelines/time_series_classification_pipelines.py +++ b/evalml/pipelines/time_series_classification_pipelines.py @@ -1,4 +1,5 @@ import pandas as pd +import woodwork as ww from evalml.objectives import get_objective from evalml.pipelines.classification_pipeline import ClassificationPipeline @@ -60,7 +61,7 @@ def fit(self, X, y): y = self._encode_targets(y) X_t = self._compute_features_during_fit(X, y) - + X_t = _convert_woodwork_types_wrapper(X_t.to_dataframe()) y_shifted = y.shift(-self.gap) X_t, y_shifted = drop_rows_with_nans(X_t, y_shifted) self.estimator.fit(X_t, y_shifted) @@ -89,6 +90,12 @@ def _estimator_predict_proba(self, features, y): def _predict(self, X, y, objective=None, pad=False): y_encoded = self._encode_targets(y) features = self.compute_estimator_features(X, y_encoded) + if isinstance(features, ww.DataTable): + features = _convert_woodwork_types_wrapper(features.to_dataframe()) + elif isinstance(features, ww.DataColumn): + features = _convert_woodwork_types_wrapper(features.to_series()) + features_no_nan, y_encoded = drop_rows_with_nans(features, y_encoded) predictions = self._estimator_predict(features_no_nan, y_encoded) if pad: @@ -111,8 +118,14 @@ def predict(self, X, y=None, objective=None): y = _convert_woodwork_types_wrapper(y.to_series()) n_features = max(len(y), X.shape[0]) predictions = self._predict(X, y, objective=objective, pad=False) + if isinstance(predictions, ww.DataTable): + predictions = _convert_woodwork_types_wrapper(predictions.to_dataframe()) + elif isinstance(predictions, ww.DataColumn): + predictions = _convert_woodwork_types_wrapper(predictions.to_series()) + predictions = pd.Series(self._decode_targets(predictions), name=self.input_target_name) - return pad_with_nans(predictions, max(0, n_features - predictions.shape[0])) + padded = pad_with_nans(predictions, max(0, n_features - predictions.shape[0])) + return _convert_to_woodwork_structure(padded) def predict_proba(self, X, y=None): """Make probability estimates for labels.
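Each time series method above converts features back to pandas before calling drop_rows_with_nans, because that helper drops the NaN rows produced by delayed features jointly from X and y. A sketch of the contract being relied on; the real helper lives in evalml.utils, and this signature is inferred from the call sites, so treat it as illustrative:

import pandas as pd

def drop_rows_with_nans_sketch(X, y):
    # Rows where either the delayed features or the shifted target are NaN
    # are dropped from both, keeping the two index-aligned for fitting.
    mask = ~(X.isna().any(axis=1) | y.isna())
    return X[mask], y[mask]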
@@ -131,7 +144,8 @@ def predict_proba(self, X, y=None): features_no_nan, y_encoded = drop_rows_with_nans(features, y_encoded) proba = self._estimator_predict_proba(features_no_nan, y_encoded) proba.columns = self._encoder.classes_ - return pad_with_nans(proba, max(0, features.shape[0] - proba.shape[0])) + padded = pad_with_nans(proba, max(0, features.shape[0] - proba.shape[0])) + return _convert_to_woodwork_structure(padded) def _compute_predictions(self, X, y, objectives): """Compute predictions/probabilities based on objectives.""" @@ -183,6 +197,11 @@ def threshold(self, value): def _predict(self, X, y, objective=None, pad=False): y_encoded = self._encode_targets(y) features = self.compute_estimator_features(X, y_encoded) + if isinstance(features, ww.DataTable): + features = _convert_woodwork_types_wrapper(features.to_dataframe()) + elif isinstance(features, ww.DataColumn): + features = _convert_woodwork_types_wrapper(features.to_series()) + features_no_nan, y_encoded = drop_rows_with_nans(features, y_encoded) if objective is not None: diff --git a/evalml/pipelines/time_series_regression_pipeline.py b/evalml/pipelines/time_series_regression_pipeline.py index 6148aea604..6996481ae2 100644 --- a/evalml/pipelines/time_series_regression_pipeline.py +++ b/evalml/pipelines/time_series_regression_pipeline.py @@ -1,4 +1,5 @@ import pandas as pd +import woodwork as ww from evalml.objectives import get_objective from evalml.pipelines.regression_pipeline import RegressionPipeline @@ -55,6 +56,7 @@ def fit(self, X, y): X = _convert_woodwork_types_wrapper(X.to_dataframe()) y = _convert_woodwork_types_wrapper(y.to_series()) X_t = self._compute_features_during_fit(X, y) + X_t = X_t.to_dataframe() y_shifted = y.shift(-self.gap) X_t, y_shifted = drop_rows_with_nans(X_t, y_shifted) @@ -79,13 +81,20 @@ def predict(self, X, y=None, objective=None): X = _convert_woodwork_types_wrapper(X.to_dataframe()) y = _convert_woodwork_types_wrapper(y.to_series()) features = self.compute_estimator_features(X, y) + if isinstance(features, ww.DataTable): + features = _convert_woodwork_types_wrapper(features.to_dataframe()) + elif isinstance(features, ww.DataColumn): + features = _convert_woodwork_types_wrapper(features.to_series()) + features_no_nan, y = drop_rows_with_nans(features, y) y_arg = None if self.estimator.predict_uses_y: y_arg = y predictions = self.estimator.predict(features_no_nan, y_arg) + predictions = predictions.to_series() predictions = predictions.rename(self.input_target_name) - return pad_with_nans(predictions, max(0, features.shape[0] - predictions.shape[0])) + padded = pad_with_nans(predictions, max(0, features.shape[0] - predictions.shape[0])) + return _convert_to_woodwork_structure(padded) def score(self, X, y, objectives): """Evaluate model performance on current and additional objectives. 
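On the way back out, predictions come up short whenever delayed features make the first max_delay rows unusable, so every predict path above pads with leading NaNs and only then re-wraps in woodwork. A toy worked example of that arithmetic, not taken from the patch:

import numpy as np
import pandas as pd

# With max_delay=2, rows 0-1 have NaN delayed features and yield no
# predictions; padding restores alignment with the original 5-row input.
preds = pd.Series([0.7, 0.1, 0.4])
padded = pd.concat([pd.Series([np.nan] * 2), preds], ignore_index=True)
assert len(padded) == 5 and padded.isna().sum() == 2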
diff --git a/evalml/tests/objective_tests/test_cost_benefit_matrix.py b/evalml/tests/objective_tests/test_cost_benefit_matrix.py index 46779efd16..94746cb492 100644 --- a/evalml/tests/objective_tests/test_cost_benefit_matrix.py +++ b/evalml/tests/objective_tests/test_cost_benefit_matrix.py @@ -32,7 +32,7 @@ def test_cbm_objective_automl(optimize_thresholds, X_y_binary): pipeline = automl.best_pipeline pipeline.fit(X, y) assert not np.isnan(pipeline.predict(X, cbm)).values.any() - assert not np.isnan(pipeline.predict_proba(X)).values.any() + assert not np.isnan(pipeline.predict_proba(X).to_dataframe()).values.any() assert not np.isnan(pipeline.score(X, y, [cbm])['Cost Benefit Matrix']) assert not np.isnan(list(pipeline.predict(X, cbm))).any() diff --git a/evalml/tests/pipeline_tests/test_component_graph.py b/evalml/tests/pipeline_tests/test_component_graph.py index ba3665e388..00dc664431 100644 --- a/evalml/tests/pipeline_tests/test_component_graph.py +++ b/evalml/tests/pipeline_tests/test_component_graph.py @@ -3,6 +3,7 @@ import numpy as np import pandas as pd import pytest +from pandas.testing import assert_frame_equal from evalml.exceptions import MissingComponentError from evalml.pipelines import ComponentGraph @@ -458,7 +459,7 @@ def test_compute_final_component_features_linear(mock_ohe, mock_imputer, X_y_bin component_graph.fit(X, y) X_t = component_graph.compute_final_component_features(X) - pd.testing.assert_frame_equal(X_t, X_expected) + assert_frame_equal(X_t, X_expected) assert mock_imputer.call_count == 2 assert mock_ohe.call_count == 2 @@ -478,7 +479,7 @@ def test_compute_final_component_features_nonlinear(mock_en_predict, mock_rf_pre component_graph.fit(X, y) X_t = component_graph.compute_final_component_features(X) - pd.testing.assert_frame_equal(X_t, X_expected) + assert_frame_equal(X_expected, X_t.to_dataframe()) assert mock_imputer.call_count == 2 assert mock_ohe.call_count == 4 @@ -492,7 +493,7 @@ def test_compute_final_component_features_single_component(mock_transform, X_y_b component_graph.fit(X, y) X_t = component_graph.compute_final_component_features(X) - pd.testing.assert_frame_equal(X_t, X) + assert_frame_equal(X, X_t.to_dataframe()) @patch('evalml.pipelines.components.Imputer.fit_transform') diff --git a/evalml/tests/pipeline_tests/test_pipelines.py b/evalml/tests/pipeline_tests/test_pipelines.py index 35bfa71658..d375aaa799 100644 --- a/evalml/tests/pipeline_tests/test_pipelines.py +++ b/evalml/tests/pipeline_tests/test_pipelines.py @@ -6,6 +6,7 @@ import pandas as pd import pytest import woodwork as ww +from pandas.testing import assert_frame_equal from skopt.space import Integer, Real from evalml.demos import load_breast_cancer, load_wine @@ -1061,6 +1062,7 @@ def test_compute_estimator_features(mock_scaler, mock_ohe, mock_imputer, X_y_bin X, y = X_y_binary X = pd.DataFrame(X) X_expected = pd.DataFrame(index=X.index, columns=X.columns).fillna(0) + X_expected = X_expected.astype("Int64") mock_imputer.return_value = X mock_ohe.return_value = X mock_scaler.return_value = X_expected @@ -1069,10 +1071,10 @@ def test_compute_estimator_features(mock_scaler, mock_ohe, mock_imputer, X_y_bin pipeline.fit(X, y) X_t = pipeline.compute_estimator_features(X) - pd.testing.assert_frame_equal(X_t, X_expected) + assert_frame_equal(X_expected, X_t.to_dataframe()) assert mock_imputer.call_count == 2 assert mock_ohe.call_count == 2 - assert mock_scaler.call_count == 1 + assert mock_scaler.call_count == 2 @patch('evalml.pipelines.components.Imputer.transform') @@ -1081,17 +1083,17 
@@ def test_compute_estimator_features(mock_scaler, mock_ohe, mock_imputer, X_y_bin @patch('evalml.pipelines.components.ElasticNetClassifier.predict') def test_compute_estimator_features_nonlinear(mock_en_predict, mock_rf_predict, mock_ohe, mock_imputer, X_y_binary, nonlinear_binary_pipeline_class): X, y = X_y_binary - mock_imputer.return_value = pd.DataFrame(X) - mock_ohe.return_value = pd.DataFrame(X) - mock_en_predict.return_value = pd.Series(np.ones(X.shape[0])) - mock_rf_predict.return_value = pd.Series(np.zeros(X.shape[0])) + ### TODO: can clean + mock_imputer.return_value = ww.DataTable(pd.DataFrame(X)) + mock_ohe.return_value = ww.DataTable(pd.DataFrame(X)) + mock_en_predict.return_value = ww.DataColumn(pd.Series(np.ones(X.shape[0]))) + mock_rf_predict.return_value = ww.DataColumn(pd.Series(np.zeros(X.shape[0]))) X_expected = pd.DataFrame({'Random Forest': np.zeros(X.shape[0]), 'Elastic Net': np.ones(X.shape[0])}) pipeline = nonlinear_binary_pipeline_class({}) pipeline.fit(X, y) X_t = pipeline.compute_estimator_features(X) - pd.testing.assert_frame_equal(X_t, X_expected) + assert_frame_equal(X_expected, X_t.to_dataframe()) assert mock_imputer.call_count == 2 assert mock_ohe.call_count == 4 assert mock_en_predict.call_count == 2 @@ -1316,7 +1318,7 @@ class MockPipelineNone(BinaryClassificationPipeline): @patch('evalml.pipelines.components.Estimator.predict') def test_score_with_objective_that_requires_predict_proba(mock_predict, dummy_regression_pipeline_class, X_y_binary): X, y = X_y_binary - mock_predict.return_value = pd.Series([1] * 100) + mock_predict.return_value = ww.DataColumn(pd.Series([1] * 100)) # Using pytest.raises to make sure we error if an error is not thrown. with pytest.raises(PipelineScoreError): clf = dummy_regression_pipeline_class(parameters={}) @@ -1460,7 +1462,7 @@ def test_clone_fitted(X_y_binary, logistic_regression_binary_pipeline_class): pipeline_clone.predict(X) pipeline_clone.fit(X, y) X_t_clone = pipeline_clone.predict_proba(X) - pd.testing.assert_frame_equal(X_t, X_t_clone) + assert_frame_equal(X_t.to_dataframe(), X_t_clone.to_dataframe()) def test_nonlinear_clone_fitted(X_y_binary, nonlinear_binary_pipeline_class): @@ -1477,7 +1479,7 @@ def test_nonlinear_clone_fitted(X_y_binary, nonlinear_binary_pipeline_class): pipeline_clone.predict(X) pipeline_clone.fit(X, y) X_t_clone = pipeline_clone.predict_proba(X) - pd.testing.assert_frame_equal(X_t, X_t_clone) + assert_frame_equal(X_t.to_dataframe(), X_t_clone.to_dataframe()) def test_feature_importance_has_feature_names(X_y_binary, logistic_regression_binary_pipeline_class): @@ -1639,7 +1641,7 @@ def test_targets_data_types_classification_pipelines(data_type, problem_type, ta for pipeline_class in pipeline_classes: pipeline = helper_functions.safe_init_pipeline_with_njobs_1(pipeline_class) pipeline.fit(X, y) - predictions = pipeline.predict(X, objective) + predictions = pipeline.predict(X, objective).to_series() assert set(predictions.unique()).issubset(unique_vals) predict_proba = pipeline.predict_proba(X) assert set(predict_proba.columns) == set(unique_vals) @@ -1768,13 +1770,13 @@ class StackedPipeline(base_pipeline_class): pipeline = StackedPipeline(parameters=parameters) pipeline.fit(X, y) comparison_pipeline.fit(X, y) - assert not np.isnan(pipeline.predict(X)).values.any() + assert not np.isnan(pipeline.predict(X).to_series()).values.any() pipeline_score = pipeline.score(X, y, [objective])[objective] comparison_pipeline_score = comparison_pipeline.score(X, y, [objective])[objective] if problem_type
== ProblemTypes.BINARY or problem_type == ProblemTypes.MULTICLASS: - assert not np.isnan(pipeline.predict_proba(X)).values.any() + assert not np.isnan(pipeline.predict_proba(X).to_dataframe()).values.any() assert (pipeline_score <= comparison_pipeline_score) else: assert (pipeline_score >= comparison_pipeline_score) diff --git a/evalml/utils/gen_utils.py b/evalml/utils/gen_utils.py index e5e6de9a0a..da0cca4f48 100644 --- a/evalml/utils/gen_utils.py +++ b/evalml/utils/gen_utils.py @@ -359,14 +359,14 @@ def _convert_woodwork_types_wrapper(pd_data): def pad_with_nans(pd_data, num_to_pad): """Pad the beginning num_to_pad rows with nans. Arguments: - pd_data (pd.DataFrame or pd.Series): Data to pad. + pd_data (pd.DataFrame, pd.Series, or ww.DataColumn): Data to pad. + num_to_pad (int): Number of nan rows to prepend. Returns: pd.DataFrame or pd.Series """ - if isinstance(pd_data, pd.Series): + if isinstance(pd_data, pd.Series) or isinstance(pd_data, ww.DataColumn): padding = pd.Series([np.nan] * num_to_pad, name=pd_data.name) else: padding = pd.DataFrame({col: [np.nan] * num_to_pad From 90a419083281f80ea9f1acaca1528e26da5cc592 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Tue, 12 Jan 2021 18:19:45 -0500 Subject: [PATCH 25/98] fix stacked ensemble component tests --- .../test_stacked_ensemble_classifier.py | 23 ++++++++++--------- .../test_stacked_ensemble_regressor.py | 15 ++++++------ 2 files changed, 20 insertions(+), 18 deletions(-) diff --git a/evalml/tests/component_tests/test_stacked_ensemble_classifier.py b/evalml/tests/component_tests/test_stacked_ensemble_classifier.py index 5fe69137e6..058e27a468 100644 --- a/evalml/tests/component_tests/test_stacked_ensemble_classifier.py +++ b/evalml/tests/component_tests/test_stacked_ensemble_classifier.py @@ -3,6 +3,7 @@ import numpy as np import pandas as pd import pytest +import woodwork as ww from evalml.exceptions import EnsembleMissingPipelinesError from evalml.model_family import ModelFamily @@ -62,7 +63,7 @@ def test_stacked_ensemble_init_with_multiple_same_estimators(X_y_binary, logisti clf.fit(X, y) y_pred = clf.predict(X) assert len(y_pred) == len(y) - assert not np.isnan(y_pred).all() + assert not np.isnan(y_pred.to_series()).all() def test_stacked_ensemble_n_jobs_negative_one(X_y_binary, logistic_regression_binary_pipeline_class): @@ -79,7 +80,7 @@ def test_stacked_ensemble_n_jobs_negative_one(X_y_binary, logistic_regression_bi clf.fit(X, y) y_pred = clf.predict(X) assert len(y_pred) == len(y) - assert not np.isnan(y_pred).all() + assert not np.isnan(y_pred.to_series()).all() @patch('evalml.pipelines.components.ensemble.StackedEnsembleClassifier._stacking_estimator_class') @@ -105,7 +106,7 @@ def test_stacked_ensemble_multilevel(logistic_regression_binary_pipeline_class): clf.fit(X, y) y_pred = clf.predict(X) assert len(y_pred) == len(y) - assert not np.isnan(y_pred).all() + assert not np.isnan(y_pred.to_series()).all() def test_stacked_problem_types(): @@ -131,25 +132,25 @@ def test_stacked_fit_predict_classification(X_y_binary, X_y_multi, stackable_cla clf.fit(X, y) y_pred = clf.predict(X) assert len(y_pred) == len(y) - assert isinstance(y_pred, pd.Series) - assert not np.isnan(y_pred).all() + assert isinstance(y_pred, ww.DataColumn) + assert not np.isnan(y_pred.to_series()).all() y_pred_proba = clf.predict_proba(X) - assert isinstance(y_pred_proba, pd.DataFrame) + assert isinstance(y_pred_proba, ww.DataTable) assert y_pred_proba.shape == (len(y), num_classes) - assert not np.isnan(y_pred_proba).all().all() + assert not np.isnan(y_pred_proba.to_dataframe()).all().all() clf = StackedEnsembleClassifier(input_pipelines=input_pipelines,
final_estimator=RandomForestClassifier(), n_jobs=1) clf.fit(X, y) y_pred = clf.predict(X) assert len(y_pred) == len(y) - assert isinstance(y_pred, pd.Series) - assert not np.isnan(y_pred).all() + assert isinstance(y_pred, ww.DataColumn) + assert not np.isnan(y_pred.to_series()).all() y_pred_proba = clf.predict_proba(X) assert y_pred_proba.shape == (len(y), num_classes) - assert isinstance(y_pred_proba, pd.DataFrame) - assert not np.isnan(y_pred_proba).all().all() + assert isinstance(y_pred_proba, ww.DataTable) + assert not np.isnan(y_pred_proba.to_dataframe()).all().all() @pytest.mark.parametrize("problem_type", [ProblemTypes.BINARY, ProblemTypes.MULTICLASS]) diff --git a/evalml/tests/component_tests/test_stacked_ensemble_regressor.py b/evalml/tests/component_tests/test_stacked_ensemble_regressor.py index 30be5ee549..f0d118c331 100644 --- a/evalml/tests/component_tests/test_stacked_ensemble_regressor.py +++ b/evalml/tests/component_tests/test_stacked_ensemble_regressor.py @@ -3,6 +3,7 @@ import numpy as np import pandas as pd import pytest +import woodwork as ww from evalml.exceptions import EnsembleMissingPipelinesError from evalml.model_family import ModelFamily @@ -63,7 +64,7 @@ def test_stacked_ensemble_init_with_multiple_same_estimators(X_y_regression, lin clf.fit(X, y) y_pred = clf.predict(X) assert len(y_pred) == len(y) - assert not np.isnan(y_pred).all() + assert not np.isnan(y_pred.to_series()).all() def test_stacked_ensemble_n_jobs_negative_one(X_y_regression, linear_regression_pipeline_class): @@ -80,7 +81,7 @@ def test_stacked_ensemble_n_jobs_negative_one(X_y_regression, linear_regression_ clf.fit(X, y) y_pred = clf.predict(X) assert len(y_pred) == len(y) - assert not np.isnan(y_pred).all() + assert not np.isnan(y_pred.to_series()).all() @patch('evalml.pipelines.components.ensemble.StackedEnsembleRegressor._stacking_estimator_class') @@ -106,7 +107,7 @@ def test_stacked_ensemble_multilevel(linear_regression_pipeline_class): clf.fit(X, y) y_pred = clf.predict(X) assert len(y_pred) == len(y) - assert not np.isnan(y_pred).all() + assert not np.isnan(y_pred.to_series()).all() def test_stacked_problem_types(): @@ -122,15 +123,15 @@ def test_stacked_fit_predict_regression(X_y_regression, stackable_regressors): clf.fit(X, y) y_pred = clf.predict(X) assert len(y_pred) == len(y) - assert isinstance(y_pred, pd.Series) - assert not np.isnan(y_pred).all() + assert isinstance(y_pred, ww.DataColumn) + assert not np.isnan(y_pred.to_series()).all() clf = StackedEnsembleRegressor(input_pipelines=input_pipelines, final_estimator=RandomForestRegressor(), n_jobs=1) clf.fit(X, y) y_pred = clf.predict(X) assert len(y_pred) == len(y) - assert isinstance(y_pred, pd.Series) - assert not np.isnan(y_pred).all() + assert isinstance(y_pred, ww.DataColumn) + assert not np.isnan(y_pred.to_series()).all() @patch('evalml.pipelines.components.ensemble.StackedEnsembleRegressor.fit') From fa9f09827968d7b69c1ecaf0955606c1004e083a Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Tue, 12 Jan 2021 18:48:30 -0500 Subject: [PATCH 26/98] fix more tests in automl --- evalml/automl/automl_search.py | 5 +++- .../binary_classification_pipeline.py | 1 + evalml/pipelines/component_graph.py | 1 + evalml/pipelines/regression_pipeline.py | 2 +- evalml/tests/automl_tests/test_automl.py | 24 ++++++++++--------- 5 files changed, 20 insertions(+), 13 deletions(-) diff --git a/evalml/automl/automl_search.py b/evalml/automl/automl_search.py index 18d907443b..f77dbd44cc 100644 --- a/evalml/automl/automl_search.py +++ 
b/evalml/automl/automl_search.py @@ -7,6 +7,7 @@ import cloudpickle import numpy as np import pandas as pd +import woodwork as ww from sklearn.model_selection import BaseCrossValidator from .pipeline_search_plots import PipelineSearchPlots @@ -570,7 +571,9 @@ def _tune_binary_threshold(self, pipeline, X_threshold_tuning, y_threshold_tunin if X_threshold_tuning: y_predict_proba = pipeline.predict_proba(X_threshold_tuning) if isinstance(y_predict_proba, pd.DataFrame): - y_predict_proba = y_predict_proba.iloc[:, 1] + y_predict_proba = y_predict_proba.iloc[:, 1] # shouldn't be needed + elif isinstance(y_predict_proba, ww.DataTable): + y_predict_proba = y_predict_proba.to_dataframe().iloc[:, 1] else: y_predict_proba = y_predict_proba[:, 1] pipeline.threshold = self.objective.optimize_threshold(y_predict_proba, y_threshold_tuning, X=X_threshold_tuning) diff --git a/evalml/pipelines/binary_classification_pipeline.py b/evalml/pipelines/binary_classification_pipeline.py index c3aadef773..5f7838d271 100644 --- a/evalml/pipelines/binary_classification_pipeline.py +++ b/evalml/pipelines/binary_classification_pipeline.py @@ -36,6 +36,7 @@ def _predict(self, X, objective=None): if self.threshold is None: return self._component_graph.predict(X) ypred_proba = self.predict_proba(X) + ypred_proba = ypred_proba.to_dataframe() ypred_proba = ypred_proba.iloc[:, 1] if objective is None: return ypred_proba > self.threshold diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 3ffed33f82..587505a66c 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -120,6 +120,7 @@ def fit_features(self, X, y): return _convert_to_woodwork_structure(concatted) def predict(self, X): + ### TODO """Make predictions using selected features. Arguments: diff --git a/evalml/pipelines/regression_pipeline.py b/evalml/pipelines/regression_pipeline.py index 444c0f5758..342a32011c 100644 --- a/evalml/pipelines/regression_pipeline.py +++ b/evalml/pipelines/regression_pipeline.py @@ -43,5 +43,5 @@ def score(self, X, y, objectives): dict: Ordered dictionary of objective scores """ objectives = [get_objective(o, return_instance=True) for o in objectives] - y_predicted = self.predict(X) + y_predicted = self.predict(X).to_series() return self._score_all_objectives(X, y, y_predicted, y_pred_proba=None, objectives=objectives) diff --git a/evalml/tests/automl_tests/test_automl.py b/evalml/tests/automl_tests/test_automl.py index d4ccf5e6c3..c26f0cd9fd 100644 --- a/evalml/tests/automl_tests/test_automl.py +++ b/evalml/tests/automl_tests/test_automl.py @@ -418,17 +418,19 @@ def test_automl_bad_data_check_parameter_type(): automl.search(data_checks=[MockDataCheckErrorAndWarning]) -@patch('evalml.pipelines.RegressionPipeline.fit') -@patch('evalml.pipelines.RegressionPipeline.predict') -@patch('evalml.data_checks.InvalidTargetDataCheck') -def test_automl_passes_correct_objective_name_to_invalid_target_data_checks(mock_obj, mock_predict, mock_fit, X_y_regression): - X, y = X_y_regression - mock_obj.objective_name.return_value = "R2" - automl = AutoMLSearch(X, y, max_iterations=1, problem_type=ProblemTypes.REGRESSION) - automl.search() - mock_fit.assert_called() - mock_predict.assert_called() - assert automl.objective.name == mock_obj.objective_name.return_value +# I don't think this tests what the name implies...
+# @patch('evalml.pipelines.RegressionPipeline.fit') +# @patch('evalml.pipelines.RegressionPipeline.predict') +# @patch('evalml.data_checks.InvalidTargetDataCheck') +# def test_automl_passes_correct_objective_name_to_invalid_target_data_checks(mock_obj, mock_predict, mock_fit, X_y_regression): +# X, y = X_y_regression +# mock_obj.objective_name.return_value = "R2" +# mock_predict.return_value = ww.DataColumn(pd.Series([0] * len(y))) +# automl = AutoMLSearch(X, y, max_iterations=1, problem_type=ProblemTypes.REGRESSION) +# automl.search() +# mock_fit.assert_called() +# mock_predict.assert_called() +# assert automl.objective.name == mock_obj.objective_name.return_value class MockDataCheckObjective(DataCheck): From 8e22a48f0c296f9c084461b4269ad86f10010ac4 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Tue, 12 Jan 2021 22:43:33 -0500 Subject: [PATCH 27/98] fix component graph and regression pipeline tests --- evalml/pipelines/component_graph.py | 11 ++-- .../transformers/encoders/target_encoder.py | 8 +-- .../test_classification.py | 7 +- .../test_regression.py | 8 +-- .../pipeline_tests/test_component_graph.py | 64 ++++++++++--------- 5 files changed, 53 insertions(+), 45 deletions(-) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 587505a66c..8c6991e16c 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -8,6 +8,7 @@ from evalml.pipelines.components.utils import handle_component_class from evalml.utils import ( _convert_to_woodwork_structure, + _convert_woodwork_types_wrapper, get_random_state, import_or_raise ) @@ -181,10 +182,8 @@ def _compute_features(self, component_list, X, y=None, fit=False): """ if len(component_list) == 0: return X - if isinstance(X, ww.DataTable): - X = X.to_dataframe() - if not isinstance(X, pd.DataFrame): - X = pd.DataFrame(X) + X = _convert_to_woodwork_structure(X) + X = _convert_woodwork_types_wrapper(X.to_dataframe()) output_cache = {} for component_name in component_list: @@ -205,10 +204,12 @@ def _compute_features(self, component_list, X, y=None, fit=False): if isinstance(parent_x, ww.DataColumn): parent_x_series = parent_x.to_series() parent_x = pd.DataFrame(parent_x_series, columns=[parent_input]) - parent_x = _convert_to_woodwork_structure(parent_x) + parent_x = _convert_to_woodwork_structure(parent_x).to_dataframe() x_inputs.append(parent_x) input_x, input_y = self._consolidate_inputs(x_inputs, y_input, X, y) + self.input_feature_names.update({component_name: list(input_x.columns)}) + if isinstance(component_instance, Transformer): if fit: output = component_instance.fit_transform(input_x, input_y) diff --git a/evalml/pipelines/components/transformers/encoders/target_encoder.py b/evalml/pipelines/components/transformers/encoders/target_encoder.py index ea97d2d5a0..dfbe849890 100644 --- a/evalml/pipelines/components/transformers/encoders/target_encoder.py +++ b/evalml/pipelines/components/transformers/encoders/target_encoder.py @@ -58,11 +58,11 @@ def fit(self, X, y): y.reset_index(drop=True, inplace=True) return super().fit(X, y) - # def transform(self, X, y=None): - # return super().transform(X, y) + def transform(self, X, y=None): + return super().transform(X, y) - # def fit_transform(self, X, y): - # return self.fit(X, y).transform(X) + def fit_transform(self, X, y): + return self.fit(X, y).transform(X, y) def get_feature_names(self): """Return feature names for the input features after fitting. 
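Restoring transform/fit_transform on TargetEncoder (instead of leaning on Transformer's generic versions) keeps y flowing through, which matters because target encoding derives each category's code from the target. A toy, unsmoothed illustration of the idea, not the component's actual implementation; the real component delegates to the category_encoders package, which also applies smoothing:

import pandas as pd

X = pd.DataFrame({"cat": ["a", "a", "b", "b"]})
y = pd.Series([1, 0, 1, 1])
# Each category maps to the mean target observed for it at fit time.
category_means = y.groupby(X["cat"]).mean()  # a -> 0.5, b -> 1.0
encoded = X["cat"].map(category_means)       # [0.5, 0.5, 1.0, 1.0]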
diff --git a/evalml/tests/pipeline_tests/classification_pipeline_tests/test_classification.py b/evalml/tests/pipeline_tests/classification_pipeline_tests/test_classification.py index 5843d04fe3..f760a34a90 100644 --- a/evalml/tests/pipeline_tests/classification_pipeline_tests/test_classification.py +++ b/evalml/tests/pipeline_tests/classification_pipeline_tests/test_classification.py @@ -2,6 +2,7 @@ import pandas as pd import pytest +from pandas.testing import assert_series_equal from evalml.demos import load_breast_cancer, load_wine @@ -46,12 +47,12 @@ def test_pipeline_has_classes_property(logistic_regression_binary_pipeline_class pipeline.classes_ pipeline.fit(X, y) - pd.testing.assert_series_equal(pd.Series(pipeline.classes_), pd.Series(answer)) + assert_series_equal(pd.Series(pipeline.classes_), pd.Series(answer)) def test_woodwork_classification_pipeline(logistic_regression_binary_pipeline_class): X, y = load_breast_cancer() mock_pipeline = logistic_regression_binary_pipeline_class(parameters={"Logistic Regression Classifier": {"n_jobs": 1}}) mock_pipeline.fit(X, y) - assert not pd.isnull(mock_pipeline.predict(X)).any() - assert not pd.isnull(mock_pipeline.predict_proba(X)).any().any() + assert not pd.isnull(mock_pipeline.predict(X).to_series()).any() + assert not pd.isnull(mock_pipeline.predict_proba(X).to_dataframe()).any().any() diff --git a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py index 03726c60ca..6732e7bf1b 100644 --- a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py +++ b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py @@ -21,9 +21,9 @@ def test_invalid_targets_regression_pipeline(target_type, dummy_regression_pipel def test_woodwork_regression_pipeline(linear_regression_pipeline_class): X, y = load_diabetes() - mock_regression_pipeline = linear_regression_pipeline_class(parameters={'Linear Regressor': {'n_jobs': 1}}) - mock_regression_pipeline.fit(X, y) - assert not pd.isnull(mock_regression_pipeline.predict(X)).any() + regression_pipeline = linear_regression_pipeline_class(parameters={'Linear Regressor': {'n_jobs': 1}}) + regression_pipeline.fit(X, y) + assert not pd.isnull(regression_pipeline.predict(X).to_series()).any() def test_custom_indices(): @@ -35,6 +35,6 @@ class MyTargetPipeline(RegressionPipeline): X = pd.DataFrame({"a": ["a", "b", "a", "a", "a", "c", "c", "c"], "b": [0, 1, 1, 1, 1, 1, 0, 1]}) y = pd.Series([0, 0, 0, 1, 0, 1, 0, 0], index=[7, 2, 1, 4, 5, 3, 6, 8]) - x1, x2, y1, y2 = split_data(X, y, problem_type='binary') + x1, x2, y1, y2 = split_data(X, y, problem_type='regression') tp = MyTargetPipeline({}) tp.fit(x2, y2) diff --git a/evalml/tests/pipeline_tests/test_component_graph.py b/evalml/tests/pipeline_tests/test_component_graph.py index 00dc664431..60fc9b2917 100644 --- a/evalml/tests/pipeline_tests/test_component_graph.py +++ b/evalml/tests/pipeline_tests/test_component_graph.py @@ -3,7 +3,12 @@ import numpy as np import pandas as pd import pytest -from pandas.testing import assert_frame_equal +import woodwork as ww +from pandas.testing import ( + assert_frame_equal, + assert_index_equal, + assert_series_equal +) from evalml.exceptions import MissingComponentError from evalml.pipelines import ComponentGraph @@ -352,19 +357,20 @@ def test_fit(mock_predict, mock_fit, mock_fit_transform, example_graph, X_y_bina @patch('evalml.pipelines.components.Imputer.fit_transform') 
@patch('evalml.pipelines.components.OneHotEncoder.transform') -def test_fit_correct_inputs(mock_transform, mock_fit_transform, X_y_binary): +def test_fit_correct_inputs(mock_ohe_transform, mock_imputer_fit_transform, X_y_binary): X, y = X_y_binary X = pd.DataFrame(X) y = pd.Series(y) graph = {'Imputer': [Imputer], 'OHE': [OneHotEncoder, 'Imputer.x', 'Imputer.y']} - expected_x = pd.DataFrame(index=X.index, columns=X.index).fillna(1) - expected_y = pd.Series(index=y.index).fillna(0) - mock_fit_transform.return_value = tuple((expected_x, expected_y)) + expected_x = ww.DataTable(pd.DataFrame(index=X.index, columns=X.index).fillna(1)) + expected_y = ww.DataColumn(pd.Series(index=y.index).fillna(0)) + mock_imputer_fit_transform.return_value = tuple((expected_x, expected_y)) + mock_ohe_transform.return_value = expected_x component_graph = ComponentGraph(graph).instantiate({}) component_graph.fit(X, y) - - pd.testing.assert_frame_equal(mock_transform.call_args[0][0], expected_x) - pd.testing.assert_series_equal(mock_transform.call_args[0][1], expected_y) + ### TODO + assert_frame_equal(mock_ohe_transform.call_args[0][0], expected_x.to_dataframe()) + assert_series_equal(mock_ohe_transform.call_args[0][1].to_series(), expected_y.to_series()) @patch('evalml.pipelines.components.Transformer.fit_transform') @@ -376,10 +382,10 @@ def test_fit_features(mock_predict, mock_fit, mock_fit_transform, X_y_binary): component_graph = ComponentGraph.from_list(component_list) component_graph.instantiate({}) - mock_X_t = pd.DataFrame(np.ones(pd.DataFrame(X).shape)) - mock_fit_transform.return_value = mock_X_t + mock_X_t = pd.DataFrame(np.ones(X.shape)) + mock_fit_transform.return_value = ww.DataTable(mock_X_t) mock_fit.return_value = Estimator - mock_predict.return_value = pd.Series(y) + mock_predict.return_value = ww.DataColumn(y) component_graph.fit_features(X, y) @@ -396,10 +402,10 @@ def test_fit_features_nonlinear(mock_predict, mock_fit, mock_fit_transform, exam component_graph = ComponentGraph(example_graph) component_graph.instantiate({}) - mock_X_t = pd.DataFrame(np.ones(pd.DataFrame(X).shape)) + mock_X_t = ww.DataTable(np.ones(pd.DataFrame(X).shape)) mock_fit_transform.return_value = mock_X_t mock_fit.return_value = Estimator - mock_predict.return_value = pd.Series(y) + mock_predict.return_value = ww.DataColumn(pd.Series(y)) component_graph.fit_features(X, y) @@ -450,8 +456,8 @@ def test_compute_final_component_features_linear(mock_ohe, mock_imputer, X_y_bin X, y = X_y_binary X = pd.DataFrame(X) X_expected = pd.DataFrame(index=X.index, columns=X.columns).fillna(0) - mock_imputer.return_value = X - mock_ohe.return_value = X_expected + mock_imputer.return_value = ww.DataTable(X) + mock_ohe.return_value = ww.DataTable(X_expected) component_list = ['Imputer', 'One Hot Encoder', 'Random Forest Classifier'] component_graph = ComponentGraph().from_list(component_list) @@ -459,7 +465,7 @@ def test_compute_final_component_features_linear(mock_ohe, mock_imputer, X_y_bin component_graph.fit(X, y) X_t = component_graph.compute_final_component_features(X) - assert_frame_equal(X_t, X_expected) + assert_frame_equal(X_expected, X_t.to_dataframe()) assert mock_imputer.call_count == 2 assert mock_ohe.call_count == 2 @@ -488,12 +494,12 @@ def test_compute_final_component_features_nonlinear(mock_en_predict, mock_rf_pre def test_compute_final_component_features_single_component(mock_transform, X_y_binary): X, y = X_y_binary X = pd.DataFrame(X) - mock_transform.return_value = pd.DataFrame() + mock_transform.return_value = 
ww.DataTable(X) component_graph = ComponentGraph({'Dummy Component': [DummyTransformer]}).instantiate({}) component_graph.fit(X, y) X_t = component_graph.compute_final_component_features(X) - assert_frame_equal(X, X_t.to_dataframe()) + assert_frame_equal(X, X_t) @patch('evalml.pipelines.components.Imputer.fit_transform') @@ -517,7 +523,7 @@ def test_predict_empty_graph(X_y_binary): component_graph.fit(X, y) X_t = component_graph.predict(X) - pd.testing.assert_frame_equal(X_t, X) + assert_frame_equal(X_t, X) @patch('evalml.pipelines.components.OneHotEncoder.fit_transform') @@ -532,7 +538,7 @@ def test_predict_transformer_end(mock_fit_transform, mock_transform, X_y_binary) component_graph.fit(X, y) output = component_graph.predict(X) - pd.testing.assert_frame_equal(output, pd.DataFrame(X)) + assert_frame_equal(output, pd.DataFrame(X)) def test_no_instantiate_before_fit(X_y_binary): @@ -585,8 +591,8 @@ def test_computation_input_custom_index(index): component_graph.instantiate({}) component_graph.fit(X, y) - X_t = component_graph.predict(X) - pd.testing.assert_index_equal(X_t.index, pd.RangeIndex(start=0, stop=5, step=1)) + X_t = component_graph.predict(X).to_series() + assert_index_equal(X_t.index, pd.RangeIndex(start=0, stop=5, step=1)) assert not X_t.isna().any(axis=None) @@ -619,13 +625,13 @@ def test_component_graph_evaluation_plumbing(mock_transa, mock_transb, mock_tran component_graph.fit(X, y) predict_out = component_graph.predict(X) - pd.testing.assert_frame_equal(mock_transa.call_args[0][0], X) - pd.testing.assert_frame_equal(mock_transb.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6)}, columns=['feature trans', 'feature a'])) - pd.testing.assert_frame_equal(mock_transc.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6), 'feature b': np.ones(6) * 2}, columns=['feature trans', 'feature a', 'feature b'])) - pd.testing.assert_frame_equal(mock_preda.call_args[0][0], X) - pd.testing.assert_frame_equal(mock_predb.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6)}, columns=['feature trans', 'feature a'])) - pd.testing.assert_frame_equal(mock_predc.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6), 'estimator a': [0, 0, 0, 1, 0, 0], 'feature b': np.ones(6) * 2, 'estimator b': [0, 0, 0, 0, 1, 0], 'feature c': np.ones(6) * 3}, columns=['feature trans', 'feature a', 'estimator a', 'feature b', 'estimator b', 'feature c'])) - pd.testing.assert_series_equal(predict_out, pd.Series([0, 0, 0, 0, 0, 1])) + assert_frame_equal(mock_transa.call_args[0][0], X) + assert_frame_equal(mock_transb.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6)}, columns=['feature trans', 'feature a'])) + assert_frame_equal(mock_transc.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6), 'feature b': np.ones(6) * 2}, columns=['feature trans', 'feature a', 'feature b'])) + assert_frame_equal(mock_preda.call_args[0][0], X) + assert_frame_equal(mock_predb.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6)}, columns=['feature trans', 'feature a'])) + assert_frame_equal(mock_predc.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6), 'estimator a': [0, 0, 0, 1, 0, 0], 'feature b': np.ones(6) * 2, 'estimator b': [0, 0, 0, 0, 1, 0], 'feature c': np.ones(6) * 3}, columns=['feature trans', 'feature a', 
'estimator a', 'feature b', 'estimator b', 'feature c'])) + assert_series_equal(predict_out, pd.Series([0, 0, 0, 0, 0, 1])) def test_input_feature_names(example_graph): From bb10ab15027fccd8587af506e6eb1153d24167c1 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 13 Jan 2021 00:18:14 -0500 Subject: [PATCH 28/98] fix time series pipeline tests --- evalml/objectives/objective_base.py | 1 + evalml/pipelines/component_graph.py | 5 ++- evalml/pipelines/pipeline_base.py | 3 ++ .../time_series_classification_pipelines.py | 26 +++++++++++---- .../time_series_regression_pipeline.py | 2 ++ .../test_time_series_pipeline.py | 33 ++++++++++--------- evalml/utils/gen_utils.py | 1 - 7 files changed, 47 insertions(+), 24 deletions(-) diff --git a/evalml/objectives/objective_base.py b/evalml/objectives/objective_base.py index 4d004676b7..ec0d634e08 100644 --- a/evalml/objectives/objective_base.py +++ b/evalml/objectives/objective_base.py @@ -114,6 +114,7 @@ def validate_inputs(self, y_true, y_predicted): raise ValueError("y_true contains NaN or infinity") # y_predicted could be a 1d vector (predictions) or a 2d vector (classifier predicted probabilities) y_pred_flat = y_predicted.to_numpy().flatten() + if np.isnan(y_pred_flat).any() or np.isinf(y_pred_flat).any(): raise ValueError("y_predicted contains NaN or infinity") if self.score_needs_proba and np.any([(y_pred_flat < 0) | (y_pred_flat > 1)]): diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 8c6991e16c..b5e6b94e55 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -100,9 +100,12 @@ def fit_features(self, X, y): Arguments: X (pd.DataFrame): The input training data of shape [n_samples, n_features] y (pd.Series): The target training data of length [n_samples] + + Returns: + ww.DataTable """ if len(self.compute_order) <= 1: - return X + return _convert_to_woodwork_structure(X) component_outputs = self._compute_features(self.compute_order[:-1], X, y=y, fit=True) final_component_inputs = [] diff --git a/evalml/pipelines/pipeline_base.py b/evalml/pipelines/pipeline_base.py index 6dd7b9436a..ef53a48221 100644 --- a/evalml/pipelines/pipeline_base.py +++ b/evalml/pipelines/pipeline_base.py @@ -258,6 +258,9 @@ def _score_all_objectives(self, X, y, y_pred, y_pred_proba, objectives): y_pred_proba (pd.Dataframe, pd.Series, None): The predicted probabilities for classification problems. Will be a DataFrame for multiclass problems and Series otherwise. Will be None for regression problems. objectives (list): List of objectives to score. + + Returns: + Ordered dictionary with objectives and their scores. 
""" scored_successfully = OrderedDict() exceptions = OrderedDict() diff --git a/evalml/pipelines/time_series_classification_pipelines.py b/evalml/pipelines/time_series_classification_pipelines.py index 759d6df684..19ae8c1511 100644 --- a/evalml/pipelines/time_series_classification_pipelines.py +++ b/evalml/pipelines/time_series_classification_pipelines.py @@ -59,7 +59,6 @@ def fit(self, X, y): y = _convert_woodwork_types_wrapper(y.to_series()) self._encoder.fit(y) y = self._encode_targets(y) - X_t = self._compute_features_during_fit(X, y) X_t = _convert_woodwork_types_wrapper(X_t.to_dataframe()) y_shifted = y.shift(-self.gap) @@ -85,6 +84,7 @@ def _estimator_predict_proba(self, features, y): y_arg = None if self.estimator.predict_uses_y: y_arg = y + return self.estimator.predict_proba(features, y=y_arg) def _predict(self, X, y, objective=None, pad=False): @@ -98,8 +98,10 @@ def _predict(self, X, y, objective=None, pad=False): # features = _convert_woodwork_types_wrapper(features.to_series()) features_no_nan, y_encoded = drop_rows_with_nans(features, y_encoded) predictions = self._estimator_predict(features_no_nan, y_encoded) + # predictions = predictions.to_series() if pad: - return pad_with_nans(predictions, max(0, features.shape[0] - predictions.shape[0])) + padded = pad_with_nans(predictions.to_series(), max(0, features.shape[0] - predictions.shape[0])) + return _convert_to_woodwork_structure(padded) return predictions def predict(self, X, y=None, objective=None): @@ -141,8 +143,13 @@ def predict_proba(self, X, y=None): y = _convert_woodwork_types_wrapper(y.to_series()) y_encoded = self._encode_targets(y) features = self.compute_estimator_features(X, y_encoded) + if isinstance(features, ww.DataTable): + features = _convert_woodwork_types_wrapper(features.to_dataframe()) + elif isinstance(features, ww.DataColumn): + features = _convert_woodwork_types_wrapper(features.to_series()) features_no_nan, y_encoded = drop_rows_with_nans(features, y_encoded) proba = self._estimator_predict_proba(features_no_nan, y_encoded) + proba = proba.to_dataframe() proba.columns = self._encoder.classes_ padded = pad_with_nans(proba, max(0, features.shape[0] - proba.shape[0])) return _convert_to_woodwork_structure(padded) @@ -155,6 +162,12 @@ def _compute_predictions(self, X, y, objectives): y_predicted_proba = self.predict_proba(X, y) if any(not o.score_needs_proba for o in objectives): y_predicted = self._predict(X, y, pad=True) + + if isinstance(y_predicted_proba, ww.DataTable): + y_predicted_proba = _convert_woodwork_types_wrapper(y_predicted_proba.to_dataframe()) + + if isinstance(y_predicted, ww.DataColumn): + y_predicted = _convert_woodwork_types_wrapper(y_predicted.to_series()) return y_predicted, y_predicted_proba def score(self, X, y, objectives): @@ -210,17 +223,18 @@ def _predict(self, X, y, objective=None, pad=False): raise ValueError(f"Objective {objective.name} is not defined for time series binary classification.") if self.threshold is None: - predictions = self._estimator_predict(features_no_nan, y_encoded) + predictions = self._estimator_predict(features_no_nan, y_encoded).to_series() else: - proba = self._estimator_predict_proba(features_no_nan, y_encoded) + proba = self._estimator_predict_proba(features_no_nan, y_encoded).to_dataframe() proba = proba.iloc[:, 1] if objective is None: predictions = proba > self.threshold else: predictions = objective.decision_function(proba, threshold=self.threshold, X=features_no_nan) if pad: - return pad_with_nans(predictions, max(0, features.shape[0] - 
predictions.shape[0])) - return predictions + padded = pad_with_nans(predictions, max(0, features.shape[0] - predictions.shape[0])) + return _convert_to_woodwork_structure(padded) + return _convert_to_woodwork_structure(predictions) @staticmethod def _score(X, y, predictions, objective): diff --git a/evalml/pipelines/time_series_regression_pipeline.py b/evalml/pipelines/time_series_regression_pipeline.py index 6996481ae2..8c86ed9519 100644 --- a/evalml/pipelines/time_series_regression_pipeline.py +++ b/evalml/pipelines/time_series_regression_pipeline.py @@ -116,6 +116,8 @@ def score(self, X, y, objectives): y = _convert_woodwork_types_wrapper(y.to_series()) y_predicted = self.predict(X, y) + y_predicted = _convert_woodwork_types_wrapper(y_predicted.to_series()) + y_shifted = y.shift(-self.gap) objectives = [get_objective(o, return_instance=True) for o in objectives] y_shifted, y_predicted = drop_rows_with_nans(y_shifted, y_predicted) diff --git a/evalml/tests/pipeline_tests/test_time_series_pipeline.py b/evalml/tests/pipeline_tests/test_time_series_pipeline.py index 8b4d2f675d..8b0048c96e 100644 --- a/evalml/tests/pipeline_tests/test_time_series_pipeline.py +++ b/evalml/tests/pipeline_tests/test_time_series_pipeline.py @@ -125,7 +125,7 @@ class Pipeline(pipeline_class): "pipeline": {"gap": gap, "max_delay": max_delay}}) def mock_predict(df, y=None): - return pd.Series(range(200, 200 + df.shape[0])) + return ww.DataColumn(pd.Series(range(200, 200 + df.shape[0]))) if isinstance(pl, TimeSeriesRegressionPipeline): mock_regressor_predict.side_effect = mock_predict @@ -141,9 +141,9 @@ def mock_predict(df, y=None): # Check that the predictions have NaNs for the first n_delay dates if include_delayed_features: - assert np.isnan(preds.values[:max_delay]).all() + assert np.isnan(preds.to_series().values[:max_delay]).all() else: - assert not np.isnan(preds.values).any() + assert not np.isnan(preds.to_series().values).any() @pytest.mark.parametrize("only_use_y", [True, False]) @@ -184,8 +184,8 @@ class Pipeline(pipeline_class): "delay_target": include_delayed_features}, "pipeline": {"gap": gap, "max_delay": max_delay}}) - def mock_predict(df, y=None): - return pd.Series(range(200, 200 + df.shape[0])) + def mock_predict(X, y=None): + return ww.DataColumn(pd.Series(range(200, 200 + X.shape[0]))) if isinstance(pl, TimeSeriesRegressionPipeline): mock_regressor_predict.side_effect = mock_predict @@ -216,7 +216,7 @@ def mock_predict(df, y=None): def test_classification_pipeline_encodes_targets(mock_score, mock_predict, mock_fit, pipeline_class, X_y_binary): X, y = X_y_binary y_series = pd.Series(y) - mock_predict.return_value = y_series + mock_predict.return_value = ww.DataColumn(y_series) X = pd.DataFrame({"feature": range(len(y))}) y_encoded = y_series.map(lambda label: "positive" if label == 1 else "negative") @@ -267,13 +267,13 @@ def fit(self, X, y): """No op.""" def predict(self, X, y): - return y + return ww.DataColumn(y) def predict_proba(self, X, y): n_classes = len(y.value_counts()) mode_index = 0 proba_arr = np.array([[1.0 if i == mode_index else 0.0 for i in range(n_classes)]] * len(y)) - return pd.DataFrame(proba_arr) + return ww.DataTable(pd.DataFrame(proba_arr)) @pytest.mark.parametrize("pipeline_class,objectives", [(TimeSeriesBinaryClassificationPipeline, ["MCC Binary"]), @@ -285,7 +285,7 @@ def predict_proba(self, X, y): (TimeSeriesRegressionPipeline, ['R2']), (TimeSeriesRegressionPipeline, ['R2', "Mean Absolute Percentage Error"])]) @pytest.mark.parametrize("use_ww", [True, False]) -def 
test_score_works(pipeline_class, objectives, use_ww, X_y_binary, X_y_multi, X_y_regression): +def test_score_works(pipeline_class, objectives, use_ww, X_y_binary, X_y_multi, X_y_regression, make_data_type): preprocessing = ['Delayed Feature Transformer'] if pipeline_class == TimeSeriesRegressionPipeline: @@ -312,13 +312,13 @@ class Pipeline(pipeline_class): y = pd.Series(y) expected_unique_values = None if use_ww: - X = ww.DataTable(X) - y = ww.DataColumn(y) + X = make_data_type("ww", X) + y = make_data_type("ww", y) pl.fit(X, y) if expected_unique_values: # NaNs are expected because of padding due to max_delay - assert set(pl.predict(X, y).dropna().unique()) == expected_unique_values + assert set(pl.predict(X, y).to_series().dropna().unique()) == expected_unique_values pl.score(X, y, objectives) @@ -348,14 +348,14 @@ class Pipeline(pipeline_class): pl.fit(X, y) # NaNs are expected because of padding due to max_delay - assert set(pl.predict(X, y).dropna().unique()) == expected_unique_values + assert set(pl.predict(X, y).to_series().dropna().unique()) == expected_unique_values pl.score(X, y, objectives) @patch('evalml.pipelines.TimeSeriesClassificationPipeline._decode_targets') @patch('evalml.objectives.BinaryClassificationObjective.decision_function') -@patch('evalml.pipelines.components.Estimator.predict_proba', return_value=pd.DataFrame({0: [1.]})) -@patch('evalml.pipelines.components.Estimator.predict', return_value=pd.Series([1.])) +@patch('evalml.pipelines.components.Estimator.predict_proba', return_value=ww.DataTable(pd.DataFrame({0: [1.]}))) +@patch('evalml.pipelines.components.Estimator.predict', return_value=ww.DataColumn(pd.Series([1.]))) def test_binary_classification_predictions_thresholded_properly(mock_predict, mock_predict_proba, mock_obj_decision, mock_decode, X_y_binary, dummy_ts_binary_pipeline_class): @@ -379,7 +379,7 @@ def test_binary_classification_predictions_thresholded_properly(mock_predict, mo mock_objs = [mock_decode, mock_predict_proba] # test custom threshold set but no objective passed - mock_predict_proba.return_value = pd.DataFrame([[0.1, 0.2], [0.1, 0.2]]) + mock_predict_proba.return_value = ww.DataTable(pd.DataFrame([[0.1, 0.2], [0.1, 0.2]])) binary_pipeline.threshold = 0.6 binary_pipeline._encoder.classes_ = [0, 1] binary_pipeline.predict(X, y) @@ -400,6 +400,7 @@ def test_binary_classification_predictions_thresholded_properly(mock_predict, mo # test custom threshold set and objective passed binary_pipeline.threshold = 0.6 + mock_obj_decision.return_value = pd.Series([1.]) binary_pipeline.predict(X, y, 'precision') for mock_obj in mock_objs: mock_obj.assert_called() diff --git a/evalml/utils/gen_utils.py b/evalml/utils/gen_utils.py index da0cca4f48..8e54c5ff84 100644 --- a/evalml/utils/gen_utils.py +++ b/evalml/utils/gen_utils.py @@ -338,7 +338,6 @@ def _convert_woodwork_types_wrapper(pd_data): nullable_to_numpy_mapping_nan = {pd.Int64Dtype: 'float64', pd.BooleanDtype: 'object', pd.StringDtype: 'object'} - if isinstance(pd_data, pd.api.extensions.ExtensionArray): if pd.isna(pd_data).any(): return pd.Series(pd_data.to_numpy(na_value=np.nan), dtype=nullable_to_numpy_mapping_nan[type(pd_data.dtype)]) From 8699d374c78aecc2643a509073c188040f4ba091 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 13 Jan 2021 02:01:06 -0500 Subject: [PATCH 29/98] fix more component tests --- .../classifiers/lightgbm_classifier.py | 2 +- .../test_decision_tree_classifier.py | 8 ++--- .../test_decision_tree_regressor.py | 2 +- .../component_tests/test_en_classifier.py | 8 
++--- .../component_tests/test_en_regressor.py | 2 +- .../component_tests/test_et_classifier.py | 8 ++--- .../component_tests/test_et_regressor.py | 2 +- .../component_tests/test_lgbm_classifier.py | 33 ++++++++++--------- .../component_tests/test_lgbm_regressor.py | 4 +-- 9 files changed, 35 insertions(+), 34 deletions(-) diff --git a/evalml/pipelines/components/estimators/classifiers/lightgbm_classifier.py b/evalml/pipelines/components/estimators/classifiers/lightgbm_classifier.py index 3159f80385..cf8dfd9e31 100644 --- a/evalml/pipelines/components/estimators/classifiers/lightgbm_classifier.py +++ b/evalml/pipelines/components/estimators/classifiers/lightgbm_classifier.py @@ -106,7 +106,7 @@ def fit(self, X, y=None): def predict(self, X): X_encoded = self._encode_categories(X) - predictions = super().predict(X_encoded) + predictions = super().predict(X_encoded).to_series() if self._label_encoder: predictions = pd.Series(self._label_encoder.inverse_transform(predictions.astype(np.int64))) return _convert_to_woodwork_structure(predictions) diff --git a/evalml/tests/component_tests/test_decision_tree_classifier.py b/evalml/tests/component_tests/test_decision_tree_classifier.py index d524ec918b..91d9ee8398 100644 --- a/evalml/tests/component_tests/test_decision_tree_classifier.py +++ b/evalml/tests/component_tests/test_decision_tree_classifier.py @@ -29,8 +29,8 @@ def test_fit_predict_binary(X_y_binary): y_pred = clf.predict(X) y_pred_proba = clf.predict_proba(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5) - np.testing.assert_almost_equal(y_pred_proba, y_pred_proba_sk, decimal=5) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) + np.testing.assert_almost_equal(y_pred_proba_sk, y_pred_proba.to_dataframe().values, decimal=5) def test_fit_predict_multi(X_y_multi): @@ -46,8 +46,8 @@ def test_fit_predict_multi(X_y_multi): y_pred = clf.predict(X) y_pred_proba = clf.predict_proba(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5) - np.testing.assert_almost_equal(y_pred_proba, y_pred_proba_sk, decimal=5) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) + np.testing.assert_almost_equal(y_pred_proba_sk, y_pred_proba.to_dataframe().values, decimal=5) def test_feature_importance(X_y_binary): diff --git a/evalml/tests/component_tests/test_decision_tree_regressor.py b/evalml/tests/component_tests/test_decision_tree_regressor.py index 57ae041b09..e65f04af9c 100644 --- a/evalml/tests/component_tests/test_decision_tree_regressor.py +++ b/evalml/tests/component_tests/test_decision_tree_regressor.py @@ -26,7 +26,7 @@ def test_fit_predict(X_y_regression): clf.fit(X, y) y_pred = clf.predict(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) def test_feature_importance(X_y_regression): diff --git a/evalml/tests/component_tests/test_en_classifier.py b/evalml/tests/component_tests/test_en_classifier.py index 1dc453a507..28780c845d 100644 --- a/evalml/tests/component_tests/test_en_classifier.py +++ b/evalml/tests/component_tests/test_en_classifier.py @@ -37,8 +37,8 @@ def test_fit_predict_binary(X_y_binary): y_pred = clf.predict(X) y_pred_proba = clf.predict_proba(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5) - np.testing.assert_almost_equal(y_pred_proba, y_pred_proba_sk, decimal=5) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) + 
np.testing.assert_almost_equal(y_pred_proba_sk, y_pred_proba.to_dataframe().values, decimal=5) def test_fit_predict_multi(X_y_multi): @@ -59,8 +59,8 @@ def test_fit_predict_multi(X_y_multi): y_pred = clf.predict(X) y_pred_proba = clf.predict_proba(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5) - np.testing.assert_almost_equal(y_pred_proba, y_pred_proba_sk, decimal=5) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) + np.testing.assert_almost_equal(y_pred_proba_sk, y_pred_proba.to_dataframe().values, decimal=5) def test_feature_importance(X_y_binary): diff --git a/evalml/tests/component_tests/test_en_regressor.py b/evalml/tests/component_tests/test_en_regressor.py index 7973ca2078..22f1a1825a 100644 --- a/evalml/tests/component_tests/test_en_regressor.py +++ b/evalml/tests/component_tests/test_en_regressor.py @@ -43,7 +43,7 @@ def test_fit_predict(X_y_regression): clf.fit(X, y) y_pred = clf.predict(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) def test_feature_importance(X_y_regression): diff --git a/evalml/tests/component_tests/test_et_classifier.py b/evalml/tests/component_tests/test_et_classifier.py index 91b7686512..37cb0678fe 100644 --- a/evalml/tests/component_tests/test_et_classifier.py +++ b/evalml/tests/component_tests/test_et_classifier.py @@ -29,8 +29,8 @@ def test_fit_predict_binary(X_y_binary): y_pred = clf.predict(X) y_pred_proba = clf.predict_proba(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5) - np.testing.assert_almost_equal(y_pred_proba, y_pred_proba_sk, decimal=5) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) + np.testing.assert_almost_equal(y_pred_proba_sk, y_pred_proba.to_dataframe().values, decimal=5) def test_fit_predict_multi(X_y_multi): @@ -46,8 +46,8 @@ def test_fit_predict_multi(X_y_multi): y_pred = clf.predict(X) y_pred_proba = clf.predict_proba(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5) - np.testing.assert_almost_equal(y_pred_proba, y_pred_proba_sk, decimal=5) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) + np.testing.assert_almost_equal(y_pred_proba_sk, y_pred_proba.to_dataframe().values, decimal=5) def test_feature_importance(X_y_binary): diff --git a/evalml/tests/component_tests/test_et_regressor.py b/evalml/tests/component_tests/test_et_regressor.py index 7a6e88ca7f..f4813d5dfc 100644 --- a/evalml/tests/component_tests/test_et_regressor.py +++ b/evalml/tests/component_tests/test_et_regressor.py @@ -26,7 +26,7 @@ def test_fit_predict(X_y_regression): clf.fit(X, y) y_pred = clf.predict(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) def test_feature_importance(X_y_regression): diff --git a/evalml/tests/component_tests/test_lgbm_classifier.py b/evalml/tests/component_tests/test_lgbm_classifier.py index 747aa3aa76..8a92144000 100644 --- a/evalml/tests/component_tests/test_lgbm_classifier.py +++ b/evalml/tests/component_tests/test_lgbm_classifier.py @@ -3,6 +3,7 @@ import numpy as np import pandas as pd import pytest +import woodwork as ww from pandas.testing import assert_frame_equal, assert_series_equal from pytest import importorskip @@ -72,8 +73,8 @@ def test_fit_predict_binary(X_y_binary): y_pred = clf.predict(X) y_pred_proba = clf.predict_proba(X) - np.testing.assert_almost_equal(y_pred, 
y_pred_sk, decimal=5) - np.testing.assert_almost_equal(y_pred_proba, y_pred_proba_sk, decimal=5) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) + np.testing.assert_almost_equal(y_pred_proba_sk, y_pred_proba.to_dataframe().values, decimal=5) def test_fit_predict_multi(X_y_multi): @@ -89,8 +90,8 @@ def test_fit_predict_multi(X_y_multi): y_pred = clf.predict(X) y_pred_proba = clf.predict_proba(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5) - np.testing.assert_almost_equal(y_pred_proba, y_pred_proba_sk, decimal=5) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) + np.testing.assert_almost_equal(y_pred_proba_sk, y_pred_proba.to_dataframe().values, decimal=5) def test_feature_importance(X_y_binary): @@ -126,12 +127,12 @@ def test_fit_string_features(X_y_binary): y_pred = clf.predict(X) y_pred_proba = clf.predict_proba(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5) - np.testing.assert_almost_equal(y_pred_proba, y_pred_proba_sk, decimal=5) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) + np.testing.assert_almost_equal(y_pred_proba_sk, y_pred_proba.to_dataframe().values, decimal=5) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba') -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba', return_value=ww.DataTable(pd.DataFrame())) +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict', return_value=ww.DataColumn(pd.Series())) @patch('evalml.pipelines.components.component_base.ComponentBase.fit') def test_fit_no_categories(mock_fit, mock_predict, mock_predict_proba, X_y_binary): X, y = X_y_binary @@ -151,8 +152,8 @@ def test_fit_no_categories(mock_fit, mock_predict, mock_predict_proba, X_y_binar np.testing.assert_array_equal(arg_X, X2) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba') -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba', return_value=ww.DataTable(pd.DataFrame())) +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict', return_value=ww.DataColumn(pd.Series())) @patch('evalml.pipelines.components.component_base.ComponentBase.fit') def test_correct_args(mock_fit, mock_predict, mock_predict_proba, X_y_binary): X, y = X_y_binary @@ -188,8 +189,8 @@ def test_correct_args(mock_fit, mock_predict, mock_predict_proba, X_y_binary): assert_frame_equal(X_expected, arg_X) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba') -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba', return_value=ww.DataTable(pd.DataFrame())) +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict', return_value=ww.DataColumn(pd.Series())) @patch('evalml.pipelines.components.component_base.ComponentBase.fit') def test_categorical_data_subset(mock_fit, mock_predict, mock_predict_proba, X_y_binary): X = pd.DataFrame({"feature_1": [0, 0, 1, 1, 0, 1], "feature_2": ["a", "a", "b", "b", "c", "c"]}) @@ -216,8 +217,8 @@ def test_categorical_data_subset(mock_fit, mock_predict, mock_predict_proba, X_y assert_frame_equal(X_expected_subset, arg_X) 
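A note on the mocking pattern running through these hunks: once estimators return Woodwork structures, a bare mocked Estimator.predict breaks any caller that unwraps the result with .to_series() or .to_dataframe(), so each @patch now supplies a ww.DataColumn or ww.DataTable return_value. A minimal, self-contained sketch of the idea follows; the test name and values are illustrative only, not taken from these diffs.

import pandas as pd
import woodwork as ww
from unittest.mock import patch

@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict',
       return_value=ww.DataColumn(pd.Series([0, 1])))
def test_mocked_predict_is_woodwork(mock_predict):
    preds = mock_predict()  # stands in for component code calling Estimator.predict
    assert isinstance(preds, ww.DataColumn)
    # Callers unwrap to pandas before comparing against numpy/sklearn output,
    # mirroring the y_pred.to_series().values pattern in the hunks above.
    assert preds.to_series().tolist() == [0, 1]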
-@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba') -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba', return_value=ww.DataTable(pd.DataFrame())) +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict', return_value=ww.DataColumn(pd.Series())) @patch('evalml.pipelines.components.component_base.ComponentBase.fit') def test_multiple_fit(mock_fit, mock_predict, mock_predict_proba): y = pd.Series([1] * 4) @@ -249,7 +250,7 @@ def test_multiple_fit(mock_fit, mock_predict, mock_predict_proba): assert_frame_equal(X2_predict_expected, mock_predict_proba.call_args[0][0]) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict', return_value=ww.DataColumn(pd.Series())) @patch('evalml.pipelines.components.component_base.ComponentBase.fit') def test_multiclass_label(mock_fit, mock_predict, X_y_multi): X, y = X_y_multi @@ -264,7 +265,7 @@ def test_multiclass_label(mock_fit, mock_predict, X_y_multi): clf.predict(X) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict', return_value=ww.DataColumn(pd.Series())) @patch('evalml.pipelines.components.component_base.ComponentBase.fit') def test_binary_label_encoding(mock_fit, mock_predict, X_y_binary): X, y = X_y_binary diff --git a/evalml/tests/component_tests/test_lgbm_regressor.py b/evalml/tests/component_tests/test_lgbm_regressor.py index f6d43b4591..55316de9c6 100644 --- a/evalml/tests/component_tests/test_lgbm_regressor.py +++ b/evalml/tests/component_tests/test_lgbm_regressor.py @@ -68,7 +68,7 @@ def test_fit_predict_regression(X_y_regression): clf.fit(X, y) y_pred = clf.predict(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=3) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) def test_feature_importance(X_y_regression): @@ -102,7 +102,7 @@ def test_fit_string_features(X_y_regression): clf.fit(X, y) y_pred = clf.predict(X) - np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=3) + np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series().values, decimal=5) @patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') From 94e46557bf56ec8815404f88c44b916d5f9d1ebf Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 13 Jan 2021 13:45:15 -0500 Subject: [PATCH 30/98] fix some more tests --- evalml/pipelines/pipeline_base.py | 2 +- evalml/tests/component_tests/test_simple_imputer.py | 10 ++++------ evalml/tests/component_tests/test_xgboost_regressor.py | 2 +- 3 files changed, 6 insertions(+), 8 deletions(-) diff --git a/evalml/pipelines/pipeline_base.py b/evalml/pipelines/pipeline_base.py index ef53a48221..2a380a5ea6 100644 --- a/evalml/pipelines/pipeline_base.py +++ b/evalml/pipelines/pipeline_base.py @@ -258,7 +258,7 @@ def _score_all_objectives(self, X, y, y_pred, y_pred_proba, objectives): y_pred_proba (pd.Dataframe, pd.Series, None): The predicted probabilities for classification problems. Will be a DataFrame for multiclass problems and Series otherwise. Will be None for regression problems. objectives (list): List of objectives to score. - + Returns: Ordered dictionary with objectives and their scores. 
""" diff --git a/evalml/tests/component_tests/test_simple_imputer.py b/evalml/tests/component_tests/test_simple_imputer.py index 8ac32704f2..1ac31cefdf 100644 --- a/evalml/tests/component_tests/test_simple_imputer.py +++ b/evalml/tests/component_tests/test_simple_imputer.py @@ -234,24 +234,22 @@ def test_simple_imputer_fill_value(data_type): assert_frame_equal(expected, transformed.to_dataframe(), check_dtype=False) -def test_simple_imputer_resets_index(): +def test_simple_imputer_does_not_reset_index(): X = pd.DataFrame({'input_val': np.arange(10), 'target': np.arange(10)}) X.loc[5, 'input_val'] = np.nan assert X.index.tolist() == list(range(10)) X.drop(0, inplace=True) y = X.pop('target') - pd.testing.assert_frame_equal(X, - pd.DataFrame({'input_val': [1.0, 2, 3, 4, np.nan, 6, 7, 8, 9]}, - dtype=float, - index=list(range(1, 10)))) + pd.testing.assert_frame_equal(pd.DataFrame({'input_val': [1.0, 2, 3, 4, np.nan, 6, 7, 8, 9]}, + dtype=float, index=list(range(1, 10))), X) imputer = SimpleImputer(impute_strategy="mean") imputer.fit(X, y=y) transformed = imputer.transform(X) pd.testing.assert_frame_equal(pd.DataFrame({'input_val': [1.0, 2, 3, 4, 5, 6, 7, 8, 9]}, dtype=float, - index=list(range(0, 9))), + index=list(range(1, 10))), transformed.to_dataframe()) diff --git a/evalml/tests/component_tests/test_xgboost_regressor.py b/evalml/tests/component_tests/test_xgboost_regressor.py index 7bdbec14e5..a01d0494a4 100644 --- a/evalml/tests/component_tests/test_xgboost_regressor.py +++ b/evalml/tests/component_tests/test_xgboost_regressor.py @@ -54,7 +54,7 @@ def test_xgboost_feature_name_with_random_ascii(X_y_regression): clf.fit(X, y) predictions = clf.predict(X) assert len(predictions) == len(y) - assert not np.isnan(predictions).all() + assert not np.isnan(predictions.to_series()).all() assert len(clf.feature_importance) == len(X.columns) assert not np.isnan(clf.feature_importance).all().all() From 93dcc796cf2b875d2a12bb2fa3e8980887542d45 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 13 Jan 2021 14:26:28 -0500 Subject: [PATCH 31/98] fix baseline classification test --- .../test_baseline_classification.py | 54 +++++++++++++------ 1 file changed, 38 insertions(+), 16 deletions(-) diff --git a/evalml/tests/pipeline_tests/classification_pipeline_tests/test_baseline_classification.py b/evalml/tests/pipeline_tests/classification_pipeline_tests/test_baseline_classification.py index f8dea74132..36b80aa91d 100644 --- a/evalml/tests/pipeline_tests/classification_pipeline_tests/test_baseline_classification.py +++ b/evalml/tests/pipeline_tests/classification_pipeline_tests/test_baseline_classification.py @@ -1,5 +1,6 @@ import numpy as np import pandas as pd +from pandas.testing import assert_frame_equal, assert_series_equal from evalml.pipelines import BaselineBinaryPipeline, BaselineMulticlassPipeline from evalml.utils import get_random_state @@ -15,11 +16,14 @@ def test_baseline_binary_random(X_y_binary): } clf = BaselineBinaryPipeline(parameters=parameters) clf.fit(X, y) - predicted_proba = clf.predict_proba(X) + expected_predicted = pd.Series(get_random_state(0).choice(np.unique(y), len(X)), dtype="Int64") + assert_series_equal(expected_predicted, clf.predict(X).to_series()) - np.testing.assert_allclose(clf.predict(X), get_random_state(0).choice(np.unique(y), len(X))) + predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 2) - np.testing.assert_allclose(predicted_proba, np.array([[0.5 for i in range(len(values))]] * len(X))) + expected_predicted_proba = 
pd.DataFrame(np.array([[0.5 for i in range(len(values))]] * len(X))) + assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) @@ -36,11 +40,15 @@ def test_baseline_binary_random_weighted(X_y_binary): } clf = BaselineBinaryPipeline(parameters=parameters) clf.fit(X, y) - predicted_proba = clf.predict_proba(X) - np.testing.assert_allclose(clf.predict(X), get_random_state(0).choice(np.unique(y), len(X), p=percent_freq)) + expected_predicted = pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64") + assert_series_equal(expected_predicted, clf.predict(X).to_series()) + + expected_predicted_proba = pd.DataFrame(np.array([[percent_freq[i] for i in range(len(values))]] * len(X))) + predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 2) - np.testing.assert_allclose(predicted_proba, np.array([[percent_freq[i] for i in range(len(values))]] * len(X))) + assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) @@ -54,11 +62,15 @@ def test_baseline_binary_mode(): } clf = BaselineBinaryPipeline(parameters=parameters) clf.fit(X, y) - np.testing.assert_allclose(clf.predict(X), np.array([10] * len(X))) + + expected_predicted = pd.Series(np.array([10] * len(X)), dtype="Int64") + assert_series_equal(expected_predicted, clf.predict(X).to_series()) + predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 2) expected_predicted_proba = pd.DataFrame({10: [1., 1., 1., 1.], 11: [0., 0., 0., 0.]}) - pd.testing.assert_frame_equal(expected_predicted_proba, predicted_proba) + assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) @@ -72,11 +84,14 @@ def test_baseline_multi_random(X_y_multi): } clf = BaselineMulticlassPipeline(parameters=parameters) clf.fit(X, y) - predicted_proba = clf.predict_proba(X) - np.testing.assert_allclose(clf.predict(X), get_random_state(0).choice(np.unique(y), len(X))) + expected_predicted = pd.Series(get_random_state(0).choice(np.unique(y), len(X)), dtype="Int64") + assert_series_equal(expected_predicted, clf.predict(X).to_series()) + + predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) - np.testing.assert_allclose(predicted_proba, np.array([[1. / 3 for i in range(len(values))]] * len(X))) + expected_predicted_proba = pd.DataFrame(np.array([[1. 
/ 3 for i in range(len(values))]] * len(X))) + assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) @@ -93,11 +108,15 @@ def test_baseline_multi_random_weighted(X_y_multi): } clf = BaselineMulticlassPipeline(parameters=parameters) clf.fit(X, y) - predicted_proba = clf.predict_proba(X) - np.testing.assert_allclose(clf.predict(X), get_random_state(0).choice(np.unique(y), len(X), p=percent_freq)) + expected_predicted = pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64") + assert_series_equal(expected_predicted, clf.predict(X).to_series()) + + predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) - np.testing.assert_allclose(predicted_proba, np.array([[percent_freq[i] for i in range(len(values))]] * len(X))) + expected_predicted_proba = pd.DataFrame(np.array([[percent_freq[i] for i in range(len(values))]] * len(X))) + assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) @@ -111,9 +130,12 @@ def test_baseline_multi_mode(): } clf = BaselineMulticlassPipeline(parameters=parameters) clf.fit(X, y) - np.testing.assert_allclose(clf.predict(X), np.array([11] * len(X))) + expected_predicted = pd.Series(np.array([11] * len(X)), dtype="Int64") + assert_series_equal(expected_predicted, clf.predict(X).to_series()) + predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) expected_predicted_proba = pd.DataFrame({10: [0., 0., 0., 0.], 11: [1., 1., 1., 1.], 12: [0., 0., 0., 0.]}) - pd.testing.assert_frame_equal(expected_predicted_proba, predicted_proba) + assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) From f247141e8cf2ca90e3aa3008fc6210ccf2bf252a Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 13 Jan 2021 15:59:27 -0500 Subject: [PATCH 32/98] fixing more automl and pipeline test --- evalml/pipelines/binary_classification_pipeline.py | 5 +++-- evalml/pipelines/classification_pipeline.py | 3 +++ evalml/pipelines/component_graph.py | 2 +- evalml/pipelines/regression_pipeline.py | 2 +- .../automl_tests/test_automl_search_classification.py | 4 ++-- evalml/tests/pipeline_tests/test_pipelines.py | 8 ++++---- 6 files changed, 14 insertions(+), 10 deletions(-) diff --git a/evalml/pipelines/binary_classification_pipeline.py b/evalml/pipelines/binary_classification_pipeline.py index 5f7838d271..30ab750a79 100644 --- a/evalml/pipelines/binary_classification_pipeline.py +++ b/evalml/pipelines/binary_classification_pipeline.py @@ -1,6 +1,7 @@ from evalml.objectives import get_objective from evalml.pipelines.classification_pipeline import ClassificationPipeline from evalml.problem_types import ProblemTypes +from evalml.utils import _convert_to_woodwork_structure class BinaryClassificationPipeline(ClassificationPipeline): @@ -39,8 +40,8 @@ def _predict(self, X, objective=None): ypred_proba = ypred_proba.to_dataframe() ypred_proba = ypred_proba.iloc[:, 1] if objective is None: - return ypred_proba > self.threshold - return objective.decision_function(ypred_proba, threshold=self.threshold, X=X) + return _convert_to_woodwork_structure(ypred_proba > self.threshold) + return _convert_to_woodwork_structure(objective.decision_function(ypred_proba, threshold=self.threshold, X=X)) def 
predict_proba(self, X): """Make probability estimates for labels. Assumes that the column at index 1 represents the positive label case. diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index 3ce7631ddf..252b43f812 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -78,6 +78,8 @@ def _predict(self, X, objective=None): Returns: pd.Series: Estimated labels """ + # why does this not use objectives... because multiclass doesnt? so maybe this should be moved for less confusion + # import pdb; pdb.set_trace() return self._component_graph.predict(X) def predict(self, X, objective=None): @@ -90,6 +92,7 @@ def predict(self, X, objective=None): Returns: pd.Series : Estimated labels """ + # import pdb; pdb.set_trace() predictions = self._predict(X, objective) predictions = predictions.to_series() predictions = pd.Series(self._decode_targets(predictions), name=self.input_target_name) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index b5e6b94e55..818ac4fd6c 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -137,7 +137,7 @@ def predict(self, X): return X final_component = self.compute_order[-1] outputs = self._compute_features(self.compute_order, X) - return outputs.get(final_component, outputs.get(f'{final_component}.x')) + return _convert_to_woodwork_structure(outputs.get(final_component, outputs.get(f'{final_component}.x'))) def compute_final_component_features(self, X, y=None): ### TODO: COMBINE WITH fit_features diff --git a/evalml/pipelines/regression_pipeline.py b/evalml/pipelines/regression_pipeline.py index 342a32011c..ad3d600d7c 100644 --- a/evalml/pipelines/regression_pipeline.py +++ b/evalml/pipelines/regression_pipeline.py @@ -43,5 +43,5 @@ def score(self, X, y, objectives): dict: Ordered dictionary of objective scores """ objectives = [get_objective(o, return_instance=True) for o in objectives] - y_predicted = self.predict(X).to_series() + y_predicted = _convert_woodwork_types_wrapper(self.predict(X).to_series()) return self._score_all_objectives(X, y, y_predicted, y_pred_proba=None, objectives=objectives) diff --git a/evalml/tests/automl_tests/test_automl_search_classification.py b/evalml/tests/automl_tests/test_automl_search_classification.py index 60c85148b1..96938e0ef7 100644 --- a/evalml/tests/automl_tests/test_automl_search_classification.py +++ b/evalml/tests/automl_tests/test_automl_search_classification.py @@ -117,7 +117,7 @@ def test_binary_auto(X_y_binary): best_pipeline = automl.best_pipeline assert best_pipeline._is_fitted y_pred = best_pipeline.predict(X) - assert len(np.unique(y_pred)) == 2 + assert len(np.unique(y_pred.to_series())) == 2 def test_multi_auto(X_y_multi, multiclass_core_objectives): @@ -128,7 +128,7 @@ def test_multi_auto(X_y_multi, multiclass_core_objectives): best_pipeline = automl.best_pipeline assert best_pipeline._is_fitted y_pred = best_pipeline.predict(X) - assert len(np.unique(y_pred)) == 3 + assert len(np.unique(y_pred.to_series())) == 3 objective_in_additional_objectives = next((obj for obj in multiclass_core_objectives if obj.name == objective.name), None) multiclass_core_objectives.remove(objective_in_additional_objectives) diff --git a/evalml/tests/pipeline_tests/test_pipelines.py b/evalml/tests/pipeline_tests/test_pipelines.py index d375aaa799..91cc81cfc5 100644 --- a/evalml/tests/pipeline_tests/test_pipelines.py +++ 
b/evalml/tests/pipeline_tests/test_pipelines.py @@ -851,7 +851,7 @@ class MockMulticlassClassificationPipeline(MulticlassClassificationPipeline): @patch('evalml.pipelines.RegressionPipeline.predict') def test_score_regression_single(mock_predict, mock_fit, X_y_regression): X, y = X_y_regression - mock_predict.return_value = y + mock_predict.return_value = ww.DataColumn(y) clf = make_mock_regression_pipeline() clf.fit(X, y) objective_names = ['r2'] @@ -864,7 +864,7 @@ def test_score_regression_single(mock_predict, mock_fit, X_y_regression): @patch('evalml.pipelines.RegressionPipeline.predict') def test_score_nonlinear_regression(mock_predict, mock_fit, nonlinear_regression_pipeline_class, X_y_regression): X, y = X_y_regression - mock_predict.return_value = y + mock_predict.return_value = ww.DataColumn(y) clf = nonlinear_regression_pipeline_class({}) clf.fit(X, y) objective_names = ['r2'] @@ -926,7 +926,7 @@ def test_score_nonlinear_multiclass(mock_encode, mock_fit, mock_predict, nonline @patch('evalml.pipelines.RegressionPipeline.predict') def test_score_regression_list(mock_predict, mock_fit, X_y_binary): X, y = X_y_binary - mock_predict.return_value = y + mock_predict.return_value = ww.DataColumn(y) clf = make_mock_regression_pipeline() clf.fit(X, y) objective_names = ['r2', 'mse'] @@ -973,7 +973,7 @@ def test_score_multi_list(mock_predict, mock_fit, mock_encode, X_y_binary): def test_score_regression_objective_error(mock_predict, mock_fit, mock_objective_score, X_y_binary): mock_objective_score.side_effect = Exception('finna kabooom 💣') X, y = X_y_binary - mock_predict.return_value = y + mock_predict.return_value = ww.DataColumn(y) clf = make_mock_regression_pipeline() clf.fit(X, y) objective_names = ['r2', 'mse'] From 2e7cfe697018f4db9302b4a3ed3f89f1e2d7bcd2 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 13 Jan 2021 17:07:12 -0500 Subject: [PATCH 33/98] fix time series baseline regressor tests --- .../component_tests/test_time_series_baseline_regressor.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/evalml/tests/component_tests/test_time_series_baseline_regressor.py b/evalml/tests/component_tests/test_time_series_baseline_regressor.py index 7b059a2349..4fd03324c4 100644 --- a/evalml/tests/component_tests/test_time_series_baseline_regressor.py +++ b/evalml/tests/component_tests/test_time_series_baseline_regressor.py @@ -1,5 +1,6 @@ import numpy as np import pytest +from pandas.testing import assert_series_equal from evalml.model_family import ModelFamily from evalml.pipelines.components import TimeSeriesBaselineRegressor @@ -29,7 +30,7 @@ def test_time_series_baseline(ts_data): clf = TimeSeriesBaselineRegressor(gap=1) clf.fit(X, y) - np.testing.assert_allclose(clf.predict(X, y), y) + assert_series_equal(y.astype("Int64"), clf.predict(X, y).to_series()) np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -41,7 +42,7 @@ def test_time_series_baseline_gap_0(ts_data): clf = TimeSeriesBaselineRegressor(gap=0) clf.fit(X, y) - np.testing.assert_allclose(clf.predict(X, y), y_true) + assert_series_equal(y_true, clf.predict(X, y).to_series()) np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -51,5 +52,5 @@ def test_time_series_baseline_no_X(ts_data): clf = TimeSeriesBaselineRegressor() clf.fit(X=None, y=y) - np.testing.assert_allclose(clf.predict(X=None, y=y), y) + assert_series_equal(y.astype("Int64"), clf.predict(X=None, y=y).to_series()) np.testing.assert_allclose(clf.feature_importance, 
np.array([])) From 4c2666d0b38f4f9bcad149907206fb8f3539bc33 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 13 Jan 2021 17:27:54 -0500 Subject: [PATCH 34/98] fix baseline regression pipeline tests and cbm and component graph tests --- evalml/tests/objective_tests/test_cost_benefit_matrix.py | 4 ++-- .../regression_pipeline_tests/test_baseline_regression.py | 8 ++++++-- evalml/tests/pipeline_tests/test_component_graph.py | 7 +++---- 3 files changed, 11 insertions(+), 8 deletions(-) diff --git a/evalml/tests/objective_tests/test_cost_benefit_matrix.py b/evalml/tests/objective_tests/test_cost_benefit_matrix.py index 94746cb492..dd59639e23 100644 --- a/evalml/tests/objective_tests/test_cost_benefit_matrix.py +++ b/evalml/tests/objective_tests/test_cost_benefit_matrix.py @@ -31,10 +31,10 @@ def test_cbm_objective_automl(optimize_thresholds, X_y_binary): pipeline = automl.best_pipeline pipeline.fit(X, y) - assert not np.isnan(pipeline.predict(X, cbm)).values.any() + predictions = pipeline.predict(X, cbm) + assert not np.isnan(predictions.to_series()).values.any() assert not np.isnan(pipeline.predict_proba(X).to_dataframe()).values.any() assert not np.isnan(pipeline.score(X, y, [cbm])['Cost Benefit Matrix']) - assert not np.isnan(list(pipeline.predict(X, cbm))).any() @pytest.mark.parametrize("data_type", ['ww', 'pd']) diff --git a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_baseline_regression.py b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_baseline_regression.py index 9dbdbee2f6..1eaf3ccef4 100644 --- a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_baseline_regression.py +++ b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_baseline_regression.py @@ -1,4 +1,6 @@ import numpy as np +import pandas as pd +from pandas.testing import assert_series_equal from evalml.pipelines import BaselineRegressionPipeline @@ -13,7 +15,8 @@ def test_baseline_mean(X_y_regression): } clf = BaselineRegressionPipeline(parameters=parameters) clf.fit(X, y) - np.testing.assert_allclose(clf.predict(X), np.array([mean] * len(X))) + predictions = clf.predict(X) + assert_series_equal(pd.Series([mean] * len(X)), predictions.to_series()) np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) @@ -27,5 +30,6 @@ def test_baseline_median(X_y_regression): } clf = BaselineRegressionPipeline(parameters=parameters) clf.fit(X, y) - np.testing.assert_allclose(clf.predict(X), np.array([median] * len(X))) + predictions = clf.predict(X) + assert_series_equal(pd.Series([median] * len(X)), predictions.to_series()) np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) diff --git a/evalml/tests/pipeline_tests/test_component_graph.py b/evalml/tests/pipeline_tests/test_component_graph.py index 60fc9b2917..2c6e5c61d4 100644 --- a/evalml/tests/pipeline_tests/test_component_graph.py +++ b/evalml/tests/pipeline_tests/test_component_graph.py @@ -523,7 +523,7 @@ def test_predict_empty_graph(X_y_binary): component_graph.fit(X, y) X_t = component_graph.predict(X) - assert_frame_equal(X_t, X) + assert_frame_equal(X, X_t) @patch('evalml.pipelines.components.OneHotEncoder.fit_transform') @@ -537,8 +537,7 @@ def test_predict_transformer_end(mock_fit_transform, mock_transform, X_y_binary) component_graph.fit(X, y) output = component_graph.predict(X) - - assert_frame_equal(output, pd.DataFrame(X)) + assert_frame_equal(pd.DataFrame(X), output.to_dataframe()) def test_no_instantiate_before_fit(X_y_binary): @@ -631,7 +630,7 @@ def 
test_component_graph_evaluation_plumbing(mock_transa, mock_transb, mock_tran assert_frame_equal(mock_preda.call_args[0][0], X) assert_frame_equal(mock_predb.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6)}, columns=['feature trans', 'feature a'])) assert_frame_equal(mock_predc.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6), 'estimator a': [0, 0, 0, 1, 0, 0], 'feature b': np.ones(6) * 2, 'estimator b': [0, 0, 0, 0, 1, 0], 'feature c': np.ones(6) * 3}, columns=['feature trans', 'feature a', 'estimator a', 'feature b', 'estimator b', 'feature c'])) - assert_series_equal(predict_out, pd.Series([0, 0, 0, 0, 0, 1])) + assert_series_equal(pd.Series([0, 0, 0, 0, 0, 1], dtype="Int64"), predict_out.to_series()) def test_input_feature_names(example_graph): From b2244b94670bc7099a8949b98adb37c39b03f04a Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 13 Jan 2021 17:39:24 -0500 Subject: [PATCH 35/98] fix prediction explanation algo tests --- .../prediction_explanations/_algorithms.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/evalml/model_understanding/prediction_explanations/_algorithms.py b/evalml/model_understanding/prediction_explanations/_algorithms.py index 01408a5d0a..ff8a069c5c 100644 --- a/evalml/model_understanding/prediction_explanations/_algorithms.py +++ b/evalml/model_understanding/prediction_explanations/_algorithms.py @@ -6,7 +6,7 @@ from evalml.model_family.model_family import ModelFamily from evalml.problem_types.problem_types import ProblemTypes -from evalml.utils import get_logger +from evalml.utils import _convert_woodwork_types_wrapper, get_logger logger = get_logger(__file__) @@ -46,7 +46,6 @@ def _compute_shap_values(pipeline, features, training_data=None): estimator = pipeline.estimator if estimator.model_family == ModelFamily.BASELINE: raise ValueError("You passed in a baseline pipeline. These are simple enough that SHAP values are not needed.") - feature_names = features.columns # This is to make sure all dtypes are numeric - SHAP algorithms will complain otherwise. 
@@ -83,6 +82,7 @@ def _compute_shap_values(pipeline, features, training_data=None): # More than 100 datapoints can negatively impact runtime according to SHAP # https://github.com/slundberg/shap/blob/master/shap/explainers/kernel.py#L114 sampled_training_data_features = pipeline.compute_estimator_features(shap.sample(training_data, 100)) + sampled_training_data_features = _convert_woodwork_types_wrapper(sampled_training_data_features.to_dataframe()) sampled_training_data_features = check_array(sampled_training_data_features) if pipeline.problem_type == ProblemTypes.REGRESSION: From da5c82d47fbf944b96add6c2e52467ec19a43f07 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 13 Jan 2021 18:41:11 -0500 Subject: [PATCH 36/98] fix explainer tests and pipeline misc tests --- .../prediction_explanations/_algorithms.py | 1 + .../_user_interface.py | 2 +- .../prediction_explanations/explainers.py | 3 ++ .../test_explainers.py | 28 +++++++++---------- .../test_binary_classification.py | 11 ++++---- .../test_time_series_baseline_regression.py | 7 +++-- 6 files changed, 28 insertions(+), 24 deletions(-) diff --git a/evalml/model_understanding/prediction_explanations/_algorithms.py b/evalml/model_understanding/prediction_explanations/_algorithms.py index ff8a069c5c..15ef505df9 100644 --- a/evalml/model_understanding/prediction_explanations/_algorithms.py +++ b/evalml/model_understanding/prediction_explanations/_algorithms.py @@ -46,6 +46,7 @@ def _compute_shap_values(pipeline, features, training_data=None): estimator = pipeline.estimator if estimator.model_family == ModelFamily.BASELINE: raise ValueError("You passed in a baseline pipeline. These are simple enough that SHAP values are not needed.") + feature_names = features.columns # This is to make sure all dtypes are numeric - SHAP algorithms will complain otherwise. 
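The _convert_woodwork_types_wrapper calls added to this file matter because SHAP hands the features to scikit-learn's check_array, which rejects pandas nullable extension dtypes (Int64, boolean, string). A rough sketch of the downcasting behavior the wrapper provides, following the nullable-to-numpy mapping visible in the gen_utils.py hunk earlier in this series; this is an illustrative approximation, not the exact implementation.

import numpy as np
import pandas as pd

def downcast_for_sklearn(series: pd.Series) -> pd.Series:
    # Nullable Int64 holding NaNs has no numpy integer equivalent, so fall
    # back to float64; without NaNs a plain int64 is safe. Other dtypes pass through.
    if isinstance(series.dtype, pd.Int64Dtype):
        if series.isna().any():
            return pd.Series(series.to_numpy(na_value=np.nan), dtype='float64')
        return series.astype('int64')
    return series

downcast_for_sklearn(pd.Series([1, 2, None], dtype='Int64'))  # dtype becomes float64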
diff --git a/evalml/model_understanding/prediction_explanations/_user_interface.py b/evalml/model_understanding/prediction_explanations/_user_interface.py index 74d7a3547b..722f1beb6f 100644 --- a/evalml/model_understanding/prediction_explanations/_user_interface.py +++ b/evalml/model_understanding/prediction_explanations/_user_interface.py @@ -212,7 +212,7 @@ def _make_single_prediction_shap_table(pipeline, input_features, top_k=3, traini str: Table """ pipeline_features = pipeline.compute_estimator_features(input_features) - + pipeline_features = pipeline_features.to_dataframe() shap_values = _compute_shap_values(pipeline, pipeline_features, training_data) normalized_shap_values = _normalize_shap_values(shap_values) diff --git a/evalml/model_understanding/prediction_explanations/explainers.py b/evalml/model_understanding/prediction_explanations/explainers.py index 8e4ae523eb..4d1e3850d3 100644 --- a/evalml/model_understanding/prediction_explanations/explainers.py +++ b/evalml/model_understanding/prediction_explanations/explainers.py @@ -174,11 +174,14 @@ def explain_predictions_best_worst(pipeline, input_features, y_true, num_to_expl try: if pipeline.problem_type == ProblemTypes.REGRESSION: y_pred = pipeline.predict(input_features) + y_pred = y_pred.to_series() y_pred_values = None errors = metric(y_true, y_pred) else: y_pred = pipeline.predict_proba(input_features) + y_pred = y_pred.to_dataframe() y_pred_values = pipeline.predict(input_features) + y_pred_values = y_pred_values.to_series() errors = metric(pipeline._encode_targets(y_true), y_pred) except Exception as e: tb = traceback.format_tb(sys.exc_info()[2]) diff --git a/evalml/tests/model_understanding_tests/prediction_explanations_tests/test_explainers.py b/evalml/tests/model_understanding_tests/prediction_explanations_tests/test_explainers.py index be11b5d0db..6e6070edaf 100644 --- a/evalml/tests/model_understanding_tests/prediction_explanations_tests/test_explainers.py +++ b/evalml/tests/model_understanding_tests/prediction_explanations_tests/test_explainers.py @@ -154,7 +154,7 @@ def test_explain_prediction(mock_normalize_shap_values, pipeline.classes_ = ["class_0", "class_1", "class_2"] # By the time we call transform, we are looking at only one row of the input data. 
- pipeline.compute_estimator_features.return_value = pd.DataFrame({"a": [10], "b": [20], "c": [30], "d": [40]}) + pipeline.compute_estimator_features.return_value = ww.DataTable(pd.DataFrame({"a": [10], "b": [20], "c": [30], "d": [40]})) features = pd.DataFrame({"a": [1], "b": [2]}) training_data = pd.DataFrame() if input_type == "ww": @@ -442,7 +442,7 @@ def _add_custom_index(answer, index_best, index_worst, output_format): abs_error_mock = MagicMock(__name__="abs_error") abs_error_mock.return_value = pd.Series([4, 1], dtype="int") mock_default_metrics.__getitem__.return_value = abs_error_mock - pipeline.predict.return_value = pd.Series([2, 1]) + pipeline.predict.return_value = ww.DataColumn(pd.Series([2, 1])) y_true = pd.Series([3, 2], index=custom_index) answer = _add_custom_index(answer, index_best=custom_index[1], index_worst=custom_index[0], output_format=output_format) @@ -451,8 +451,8 @@ def _add_custom_index(answer, index_best, index_worst, output_format): cross_entropy_mock = MagicMock(__name__="cross_entropy") mock_default_metrics.__getitem__.return_value = cross_entropy_mock cross_entropy_mock.return_value = pd.Series([0.2, 0.78]) - pipeline.predict_proba.return_value = pd.DataFrame({"benign": [0.05, 0.1], "malignant": [0.95, 0.9]}) - pipeline.predict.return_value = pd.Series(["malignant"] * 2) + pipeline.predict_proba.return_value = ww.DataTable(pd.DataFrame({"benign": [0.05, 0.1], "malignant": [0.95, 0.9]})) + pipeline.predict.return_value = ww.DataColumn(pd.Series(["malignant"] * 2)) y_true = pd.Series(["malignant", "benign"], index=custom_index) answer = _add_custom_index(answer, index_best=custom_index[0], index_worst=custom_index[1], output_format=output_format) @@ -464,9 +464,9 @@ def _add_custom_index(answer, index_best, index_worst, output_format): cross_entropy_mock = MagicMock(__name__="cross_entropy") mock_default_metrics.__getitem__.return_value = cross_entropy_mock cross_entropy_mock.return_value = pd.Series([0.15, 0.34]) - pipeline.predict_proba.return_value = pd.DataFrame({"setosa": [0.8, 0.2], "versicolor": [0.1, 0.75], - "virginica": [0.1, 0.05]}) - pipeline.predict.return_value = ["setosa", "versicolor"] + pipeline.predict_proba.return_value = ww.DataTable(pd.DataFrame({"setosa": [0.8, 0.2], "versicolor": [0.1, 0.75], + "virginica": [0.1, 0.05]})) + pipeline.predict.return_value = ww.DataColumn(pd.Series(["setosa", "versicolor"])) y_true = pd.Series(["setosa", "versicolor"], index=custom_index) answer = _add_custom_index(answer, index_best=custom_index[0], index_worst=custom_index[1], output_format=output_format) @@ -503,18 +503,18 @@ def test_explain_predictions_custom_index(mock_make_table, problem_type, output_ pipeline.name = "Test Pipeline Name" if problem_type == ProblemTypes.REGRESSION: - pipeline.predict.return_value = pd.Series([2, 1]) + pipeline.predict.return_value = ww.DataColumn(pd.Series([2, 1])) elif problem_type == ProblemTypes.BINARY: pipeline.classes_.return_value = ["benign", "malignant"] - pipeline.predict.return_value = pd.Series(["malignant"] * 2) - pipeline.predict_proba.return_value = pd.DataFrame({"benign": [0.05, 0.1], "malignant": [0.95, 0.9]}) + pipeline.predict.return_value = ww.DataColumn(pd.Series(["malignant"] * 2)) + pipeline.predict_proba.return_value = ww.DataTable(pd.DataFrame({"benign": [0.05, 0.1], "malignant": [0.95, 0.9]})) else: if output_format == "text": mock_make_table.return_value = multiclass_table pipeline.classes_.return_value = ["setosa", "versicolor", "virginica"] - pipeline.predict.return_value = 
pd.Series(["setosa", "versicolor"]) - pipeline.predict_proba.return_value = pd.DataFrame({"setosa": [0.8, 0.2], "versicolor": [0.1, 0.75], - "virginica": [0.1, 0.05]}) + pipeline.predict.return_value = ww.DataColumn(pd.Series(["setosa", "versicolor"])) + pipeline.predict_proba.return_value = ww.DataTable(pd.DataFrame({"setosa": [0.8, 0.2], "versicolor": [0.1, 0.75], + "virginica": [0.1, 0.05]})) report = explain_predictions(pipeline, input_features, training_data=input_features, output_format=output_format) if output_format == "text": @@ -578,7 +578,7 @@ def test_explain_predictions_best_worst_custom_metric(mock_make_table, output_fo pipeline.problem_type = ProblemTypes.REGRESSION pipeline.name = "Test Pipeline Name" - pipeline.predict.return_value = pd.Series([2, 1]) + pipeline.predict.return_value = ww.DataColumn(pd.Series([2, 1])) y_true = pd.Series([3, 2]) def sum(y_true, y_pred): diff --git a/evalml/tests/pipeline_tests/classification_pipeline_tests/test_binary_classification.py b/evalml/tests/pipeline_tests/classification_pipeline_tests/test_binary_classification.py index 58d3398066..5a2486459a 100644 --- a/evalml/tests/pipeline_tests/classification_pipeline_tests/test_binary_classification.py +++ b/evalml/tests/pipeline_tests/classification_pipeline_tests/test_binary_classification.py @@ -2,17 +2,17 @@ import pandas as pd import pytest +import woodwork as ww -@patch('evalml.pipelines.ClassificationPipeline._decode_targets') -@patch('evalml.objectives.BinaryClassificationObjective.decision_function') -@patch('evalml.pipelines.components.Estimator.predict_proba') -@patch('evalml.pipelines.components.Estimator.predict') +@patch('evalml.pipelines.ClassificationPipeline._decode_targets', return_value=[0, 1]) +@patch('evalml.objectives.BinaryClassificationObjective.decision_function', return_value=pd.Series([1, 0])) +@patch('evalml.pipelines.components.Estimator.predict_proba', return_value=ww.DataTable(pd.DataFrame([[0.1, 0.2], [0.1, 0.2]]))) +@patch('evalml.pipelines.components.Estimator.predict', return_value=ww.DataColumn(pd.Series([1, 0]))) def test_binary_classification_pipeline_predict(mock_predict, mock_predict_proba, mock_obj_decision, mock_decode, X_y_binary, dummy_binary_pipeline_class): mock_objs = [mock_decode, mock_predict] - mock_decode.return_value = [0, 1] X, y = X_y_binary binary_pipeline = dummy_binary_pipeline_class(parameters={"Logistic Regression Classifier": {"n_jobs": 1}}) # test no objective passed and no custom threshold uses underlying estimator's predict method @@ -30,7 +30,6 @@ def test_binary_classification_pipeline_predict(mock_predict, mock_predict_proba mock_objs = [mock_decode, mock_predict_proba] # test custom threshold set but no objective passed - mock_predict_proba.return_value = pd.DataFrame([[0.1, 0.2], [0.1, 0.2]]) binary_pipeline.threshold = 0.6 binary_pipeline._encoder.classes_ = [0, 1] binary_pipeline.predict(X) diff --git a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_time_series_baseline_regression.py b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_time_series_baseline_regression.py index cefa1e85dd..3a092bd6ac 100644 --- a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_time_series_baseline_regression.py +++ b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_time_series_baseline_regression.py @@ -3,6 +3,7 @@ import numpy as np import pandas as pd import pytest +from pandas.testing import assert_index_equal, assert_series_equal from evalml.pipelines import TimeSeriesBaselineRegressionPipeline @@ 
-13,7 +14,7 @@ def test_time_series_baseline(ts_data): clf = TimeSeriesBaselineRegressionPipeline(parameters={"pipeline": {"gap": 1, "max_delay": 1}}) clf.fit(X, y) - np.testing.assert_allclose(clf.predict(X, y), y) + assert_series_equal(y.astype("Int64").reset_index(drop=True), clf.predict(X, y).to_series()) def test_time_series_baseline_no_X(ts_data): @@ -22,7 +23,7 @@ def test_time_series_baseline_no_X(ts_data): clf = TimeSeriesBaselineRegressionPipeline(parameters={"pipeline": {"gap": 1, "max_delay": 1}}) clf.fit(X=None, y=y) - np.testing.assert_allclose(clf.predict(X=None, y=y), y) + assert_series_equal(y.astype("Int64").reset_index(drop=True), clf.predict(X=None, y=y).to_series()) @pytest.mark.parametrize("only_use_y", [True, False]) @@ -49,5 +50,5 @@ def test_time_series_baseline_score_offset(mock_score, gap, max_delay, only_use_ assert not preds.isna().any() # Target used for scoring matches expected dates - pd.testing.assert_index_equal(target.index, target_index) + assert_index_equal(target.index, target_index) np.testing.assert_equal(target.values, expected_target) From 18a7ee4808d811d0f886019bfcb78f20728dfa00 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 13 Jan 2021 19:45:22 -0500 Subject: [PATCH 37/98] holy potato fix partial dependence tests --- evalml/model_understanding/graphs.py | 17 +++++++++++------ .../latest_dependency_versions.txt | 2 +- .../model_understanding_tests/test_graphs.py | 8 ++------ 3 files changed, 14 insertions(+), 13 deletions(-) diff --git a/evalml/model_understanding/graphs.py b/evalml/model_understanding/graphs.py index adf9c91024..dbd85e5be3 100644 --- a/evalml/model_understanding/graphs.py +++ b/evalml/model_understanding/graphs.py @@ -454,6 +454,7 @@ def partial_dependence(pipeline, X, feature, grid_resolution=100): "positive" class. """ + from evalml.pipelines.components.utils import scikit_learn_wrapped_estimator X = _convert_to_woodwork_structure(X) X = _convert_woodwork_types_wrapper(X.to_dataframe()) @@ -461,15 +462,19 @@ def partial_dependence(pipeline, X, feature, grid_resolution=100): raise ValueError("Pipeline to calculate partial dependence for must be fitted") if pipeline.model_family == ModelFamily.BASELINE: raise ValueError("Partial dependence plots are not supported for Baseline pipelines") - if isinstance(pipeline, evalml.pipelines.ClassificationPipeline): - pipeline._estimator_type = "classifier" - elif isinstance(pipeline, evalml.pipelines.RegressionPipeline): - pipeline._estimator_type = "regressor" - pipeline.feature_importances_ = pipeline.feature_importance + if ((isinstance(feature, int) and X.iloc[:, feature].isnull().sum()) or (isinstance(feature, str) and X[feature].isnull().sum())): warnings.warn("There are null values in the features, which will cause NaN values in the partial dependence output. 
Fill in these values to remove the NaN values.", NullsInColumnWarning) try: - avg_pred, values = sk_partial_dependence(pipeline, X=X, features=[feature], grid_resolution=grid_resolution) + wrapped = scikit_learn_wrapped_estimator(pipeline) + if isinstance(pipeline, evalml.pipelines.ClassificationPipeline): + wrapped._estimator_type = "classifier" + wrapped.classes_ = pipeline.classes_ + elif isinstance(pipeline, evalml.pipelines.RegressionPipeline): + wrapped._estimator_type = "regressor" + wrapped.feature_importances_ = pipeline.feature_importance + wrapped._is_fitted = True + avg_pred, values = sk_partial_dependence(wrapped, X=X, features=[feature], grid_resolution=grid_resolution) finally: # Delete scikit-learn attributes that were temporarily set del pipeline._estimator_type diff --git a/evalml/tests/dependency_update_check/latest_dependency_versions.txt b/evalml/tests/dependency_update_check/latest_dependency_versions.txt index ca036df943..e218936568 100644 --- a/evalml/tests/dependency_update_check/latest_dependency_versions.txt +++ b/evalml/tests/dependency_update_check/latest_dependency_versions.txt @@ -12,7 +12,7 @@ networkx==2.5 nlp-primitives==1.1.0 numpy==1.19.5 pandas==1.1.5 -plotly==4.14.2 +plotly==4.14.3 psutil==5.8.0 requirements-parser==0.2.0 scikit-learn==0.23.2 diff --git a/evalml/tests/model_understanding_tests/test_graphs.py b/evalml/tests/model_understanding_tests/test_graphs.py index bc5cb8c73e..1596491cb3 100644 --- a/evalml/tests/model_understanding_tests/test_graphs.py +++ b/evalml/tests/model_understanding_tests/test_graphs.py @@ -727,7 +727,7 @@ def check_partial_dependence_dataframe(pipeline, part_dep, grid_size=20): def test_partial_dependence_problem_types(data_type, problem_type, X_y_binary, X_y_multi, X_y_regression, logistic_regression_binary_pipeline_class, logistic_regression_multiclass_pipeline_class, - linear_regression_pipeline_class): + linear_regression_pipeline_class, make_data_type): if problem_type == ProblemTypes.BINARY: X, y = X_y_binary pipeline = logistic_regression_binary_pipeline_class(parameters={"Logistic Regression Classifier": {"n_jobs": 1}}) @@ -740,11 +740,7 @@ def test_partial_dependence_problem_types(data_type, problem_type, X_y_binary, X X, y = X_y_regression pipeline = linear_regression_pipeline_class(parameters={"Linear Regressor": {"n_jobs": 1}}) - if data_type != "np": - X = pd.DataFrame(X) - if data_type == "ww": - X = ww.DataTable(X) - + X = make_data_type(data_type, X) pipeline.fit(X, y) part_dep = partial_dependence(pipeline, X, feature=0, grid_resolution=20) check_partial_dependence_dataframe(pipeline, part_dep) From 8cc1e525525a692b209ced18f159c8915e24cfed Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 13 Jan 2021 20:45:51 -0500 Subject: [PATCH 38/98] remove unnecessary try/finally block --- evalml/model_understanding/graphs.py | 24 ++++++++++-------------- 1 file changed, 10 insertions(+), 14 deletions(-) diff --git a/evalml/model_understanding/graphs.py b/evalml/model_understanding/graphs.py index dbd85e5be3..251d3db52f 100644 --- a/evalml/model_understanding/graphs.py +++ b/evalml/model_understanding/graphs.py @@ -465,20 +465,16 @@ def partial_dependence(pipeline, X, feature, grid_resolution=100): if ((isinstance(feature, int) and X.iloc[:, feature].isnull().sum()) or (isinstance(feature, str) and X[feature].isnull().sum())): warnings.warn("There are null values in the features, which will cause NaN values in the partial dependence output. 
Fill in these values to remove the NaN values.", NullsInColumnWarning) - try: - wrapped = scikit_learn_wrapped_estimator(pipeline) - if isinstance(pipeline, evalml.pipelines.ClassificationPipeline): - wrapped._estimator_type = "classifier" - wrapped.classes_ = pipeline.classes_ - elif isinstance(pipeline, evalml.pipelines.RegressionPipeline): - wrapped._estimator_type = "regressor" - wrapped.feature_importances_ = pipeline.feature_importance - wrapped._is_fitted = True - avg_pred, values = sk_partial_dependence(wrapped, X=X, features=[feature], grid_resolution=grid_resolution) - finally: - # Delete scikit-learn attributes that were temporarily set - del pipeline._estimator_type - del pipeline.feature_importances_ + wrapped = scikit_learn_wrapped_estimator(pipeline) + if isinstance(pipeline, evalml.pipelines.ClassificationPipeline): + wrapped._estimator_type = "classifier" + wrapped.classes_ = pipeline.classes_ + elif isinstance(pipeline, evalml.pipelines.RegressionPipeline): + wrapped._estimator_type = "regressor" + wrapped.feature_importances_ = pipeline.feature_importance + wrapped._is_fitted = True + avg_pred, values = sk_partial_dependence(wrapped, X=X, features=[feature], grid_resolution=grid_resolution) + classes = None if isinstance(pipeline, evalml.pipelines.BinaryClassificationPipeline): classes = [pipeline.classes_[1]] From 318d7857dd5dd54831be2c9e88dc6a27983fefbd Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 13 Jan 2021 21:44:03 -0500 Subject: [PATCH 39/98] update regression test to use OHE instead of target --- .../regression_pipeline_tests/test_regression.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py index 6732e7bf1b..10481b9b3a 100644 --- a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py +++ b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py @@ -28,8 +28,9 @@ def test_woodwork_regression_pipeline(linear_regression_pipeline_class): def test_custom_indices(): # custom regression pipeline + # don't need to use target encoder, which wont run on core dependencies true tests class MyTargetPipeline(RegressionPipeline): - component_graph = ['Imputer', 'Target Encoder', 'Linear Regressor'] + component_graph = ['Imputer', 'One Hot Encoder', 'Linear Regressor'] custom_name = "Target Pipeline" X = pd.DataFrame({"a": ["a", "b", "a", "a", "a", "c", "c", "c"], "b": [0, 1, 1, 1, 1, 1, 0, 1]}) From b27eca8bc0a5771e5da90dbcf57b3f69e8316e19 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 14 Jan 2021 00:09:45 -0500 Subject: [PATCH 40/98] push for tests From 20a8116e1c59596a882f39cb46a9b3bc8352fdf5 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 14 Jan 2021 20:01:48 -0500 Subject: [PATCH 41/98] hmmm... 
adding code to component graph to handle carrying original logical types set --- evalml/pipelines/classification_pipeline.py | 1 + evalml/pipelines/component_graph.py | 53 ++++++++++++++++--- .../transformers/encoders/target_encoder.py | 4 +- .../preprocessing/text_featurizer.py | 1 - .../transformers/scalers/standard_scaler.py | 10 ++++ .../components/transformers/transformer.py | 1 + .../component_tests/test_target_encoder.py | 16 +++--- 7 files changed, 66 insertions(+), 20 deletions(-) diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index 252b43f812..ee2352e897 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -39,6 +39,7 @@ def fit(self, X, y): self """ + # import pdb; pdb.set_trace() X = _convert_to_woodwork_structure(X) y = _convert_to_woodwork_structure(y) y = _convert_woodwork_types_wrapper(y.to_series()) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 818ac4fd6c..212c62dee5 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -91,6 +91,7 @@ def fit(self, X, y): X (pd.DataFrame): The input training data of shape [n_samples, n_features] y (pd.Series): The target training data of length [n_samples] """ + # import pdb; pdb.set_trace() self._compute_features(self.compute_order, X, y, fit=True) return self @@ -186,9 +187,9 @@ def _compute_features(self, component_list, X, y=None, fit=False): if len(component_list) == 0: return X X = _convert_to_woodwork_structure(X) - X = _convert_woodwork_types_wrapper(X.to_dataframe()) output_cache = {} + original_logical_types = X.logical_types for component_name in component_list: component_instance = self.get_component(component_name) if not isinstance(component_instance, ComponentBase): @@ -202,15 +203,23 @@ def _compute_features(self, component_list, X, y=None, fit=False): y_input = output_cache[parent_input] else: parent_x = output_cache.get(parent_input, output_cache.get(f'{parent_input}.x')) - if isinstance(parent_x, pd.Series): - parent_x = pd.DataFrame(parent_x, columns=[parent_input]) - if isinstance(parent_x, ww.DataColumn): - parent_x_series = parent_x.to_series() - parent_x = pd.DataFrame(parent_x_series, columns=[parent_input]) - parent_x = _convert_to_woodwork_structure(parent_x).to_dataframe() + # ideally, we want this to be woodwork stuff that's outputted and concatted. + # if isinstance(parent_x, pd.Series): + # parent_x = pd.DataFrame(parent_x, columns=[parent_input]) + # if isinstance(parent_x, ww.DataColumn): + # parent_x_series = parent_x.to_series() + # parent_x = pd.DataFrame(parent_x_series, columns=[parent_input]) + # parent_x = _convert_to_woodwork_structure(parent_x).to_dataframe() x_inputs.append(parent_x) input_x, input_y = self._consolidate_inputs(x_inputs, y_input, X, y) - + # check for original types and make sure they're preserved... 
+ # import pdb; pdb.set_trace() + # for t in original_logical_types: + # if t in input_x.columns: + # input_x = input_x.set_types({t: original_logical_types[t]}) + for t in original_logical_types: + if t in input_x.columns and "numeric" not in input_x[t].semantic_tags: + input_x = input_x.set_types({t: original_logical_types[t]}) self.input_feature_names.update({component_name: list(input_x.columns)}) if isinstance(component_instance, Transformer): @@ -235,6 +244,29 @@ def _compute_features(self, component_list, X, y=None, fit=False): output_cache[component_name] = output return output_cache + # @staticmethod + # def _consolidate_inputs(x_inputs, y_input, X, y): + # """ Combines any/all X and y inputs for a component, including handling defaults + + # Arguments: + # x_inputs (list(pd.DataFrame)): Data to be used as X input for a component + # y_input (pd.Series, None): If present, the Series to use as y input for a component, different from the original y + # X (pd.DataFrame): The original X input, to be used if there is no parent X input + # y (pd.Series): The original y input, to be used if there is no parent y input + + # Returns: + # pd.DataFrame, pd.Series: The X and y transformed values to evaluate a component with + # """ + + # if len(x_inputs) == 0: + # return_x = X + # else: + # return_x = pd.concat([x_in.to_dataframe() if isinstance(x_in, ww.DataTable) else x_in for x_in in x_inputs], axis=1) + # return_y = y + # if y_input is not None: + # return_y = y_input + # return return_x, return_y + @staticmethod def _consolidate_inputs(x_inputs, y_input, X, y): """ Combines any/all X and y inputs for a component, including handling defaults @@ -248,14 +280,19 @@ def _consolidate_inputs(x_inputs, y_input, X, y): Returns: pd.DataFrame, pd.Series: The X and y transformed values to evaluate a component with """ + merged_types_dict = {} if len(x_inputs) == 0: return_x = X else: + for x_in in x_inputs: + merged_types_dict.update(x_in.logical_types) return_x = pd.concat([x_in.to_dataframe() if isinstance(x_in, ww.DataTable) else x_in for x_in in x_inputs], axis=1) return_y = y if y_input is not None: return_y = y_input + return_x = _convert_to_woodwork_structure(return_x) + return_x.set_types(merged_types_dict) return return_x, return_y def get_component(self, component_name): diff --git a/evalml/pipelines/components/transformers/encoders/target_encoder.py b/evalml/pipelines/components/transformers/encoders/target_encoder.py index dfbe849890..e7bbbe10f2 100644 --- a/evalml/pipelines/components/transformers/encoders/target_encoder.py +++ b/evalml/pipelines/components/transformers/encoders/target_encoder.py @@ -52,15 +52,13 @@ def __init__(self, random_state=random_state) def fit(self, X, y): + # do we want to do this? 
if isinstance(X, pd.DataFrame): X.reset_index(drop=True, inplace=True) if isinstance(y, pd.Series): y.reset_index(drop=True, inplace=True) return super().fit(X, y) - def transform(self, X, y=None): - return super().transform(X, y) - def fit_transform(self, X, y): return self.fit(X, y).transform(X, y) diff --git a/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py b/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py index 24cc63c8ec..1c99bf9a23 100644 --- a/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py +++ b/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py @@ -99,7 +99,6 @@ def transform(self, X, y=None): X = _convert_to_woodwork_structure(X) if self._features is None or len(self._features) == 0: return X - X = _convert_woodwork_types_wrapper(X.to_dataframe()) text_columns = self._get_text_columns(X) es = self._make_entity_set(X, text_columns) diff --git a/evalml/pipelines/components/transformers/scalers/standard_scaler.py b/evalml/pipelines/components/transformers/scalers/standard_scaler.py index 38d70c4bcc..b5d7709c1d 100644 --- a/evalml/pipelines/components/transformers/scalers/standard_scaler.py +++ b/evalml/pipelines/components/transformers/scalers/standard_scaler.py @@ -30,7 +30,17 @@ def transform(self, X, y=None): X_index = X.index X_t = self._component_obj.transform(X) X_t_df = pd.DataFrame(X_t, columns=X_cols, index=X_index) + # import pdb; pdb.set_trace() return _convert_to_woodwork_structure(X_t_df) def fit_transform(self, X, y=None): return self.fit(X, y).transform(X, y) + + def fit(self, X, y=None): + X = _convert_to_woodwork_structure(X) + X = _convert_woodwork_types_wrapper(X.to_dataframe()) + if y is not None: + y = _convert_to_woodwork_structure(y) + y = _convert_woodwork_types_wrapper(y.to_series()) + self._component_obj.fit(X, y) + return self diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index 18baff27be..ff4b403bf4 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -42,6 +42,7 @@ def transform(self, X, y=None): y = _convert_woodwork_types_wrapper(y.to_series()) X_cols = X.columns X_index = X.index + # category treated differently from object... 
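# (annotation, not part of the patch: sklearn-style transform calls generally
# return numpy arrays, so a pandas 'category' dtype is lost on the round trip
# while plain 'object' data rebuilds unchanged, which is why callers have to
# re-apply .astype('category') after reconstructing the DataFrame.)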
X_t = self._component_obj.transform(X, y) except AttributeError: raise MethodPropertyNotFoundError("Transformer requires a transform method or a component_obj that implements transform") diff --git a/evalml/tests/component_tests/test_target_encoder.py b/evalml/tests/component_tests/test_target_encoder.py index c20d9d9f64..5d7dc5a788 100644 --- a/evalml/tests/component_tests/test_target_encoder.py +++ b/evalml/tests/component_tests/test_target_encoder.py @@ -50,14 +50,14 @@ def test_null_values_in_dataframe(): 'col_2': ["a", "b", "a", "c", "b"], 'col_3': ["a", "a", "a", "a", "a"]}) y = pd.Series([0, 1, 1, 1, 0]) - encoder = TargetEncoder(handle_missing='value') - encoder.fit(X, y) - X_t = encoder.transform(X) - X_expected = pd.DataFrame({'col_1': [0.6, 0.6, 0.6, 0.6, 0.6], - 'col_2': [0.526894, 0.526894, 0.526894, 0.6, 0.526894], - 'col_3': [0.6, 0.6, 0.6, 0.6, 0.6, ]}) - - assert_frame_equal(X_expected, X_t.to_dataframe()) + # encoder = TargetEncoder(handle_missing='value') + # encoder.fit(X, y) + # X_t = encoder.transform(X) + # X_expected = pd.DataFrame({'col_1': [0.6, 0.6, 0.6, 0.6, 0.6], + # 'col_2': [0.526894, 0.526894, 0.526894, 0.6, 0.526894], + # 'col_3': [0.6, 0.6, 0.6, 0.6, 0.6, ]}) + + # assert_frame_equal(X_expected, X_t.to_dataframe()) encoder = TargetEncoder(handle_missing='return_nan') encoder.fit(X, y) From f43d4d1c041d43751969bc1fbb42cb5d66eaf106 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 14 Jan 2021 20:30:49 -0500 Subject: [PATCH 42/98] add check for data column and data check in component graph --- evalml/pipelines/component_graph.py | 11 +++++++++-- evalml/tests/pipeline_tests/test_component_graph.py | 12 ++++++------ 2 files changed, 15 insertions(+), 8 deletions(-) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 212c62dee5..571aa16529 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -285,9 +285,16 @@ def _consolidate_inputs(x_inputs, y_input, X, y): if len(x_inputs) == 0: return_x = X else: + x_to_concat = [] for x_in in x_inputs: - merged_types_dict.update(x_in.logical_types) - return_x = pd.concat([x_in.to_dataframe() if isinstance(x_in, ww.DataTable) else x_in for x_in in x_inputs], axis=1) + if isinstance(x_in, ww.DataTable): + merged_types_dict.update(x_in.logical_types) + x_to_concat.append(x_in.to_dataframe()) + elif isinstance(x_in, ww.DataColumn): + x_to_concat.append(x_in.to_series()) + else: # shouldnt reach here. 
+ x_to_concat.append(x_in) + return_x = pd.concat(x_to_concat, axis=1) return_y = y if y_input is not None: return_y = y_input diff --git a/evalml/tests/pipeline_tests/test_component_graph.py b/evalml/tests/pipeline_tests/test_component_graph.py index 2c6e5c61d4..8e66ee7176 100644 --- a/evalml/tests/pipeline_tests/test_component_graph.py +++ b/evalml/tests/pipeline_tests/test_component_graph.py @@ -418,7 +418,7 @@ def test_fit_features_nonlinear(mock_predict, mock_fit, mock_fit_transform, exam @patch('evalml.pipelines.components.Estimator.predict') def test_predict(mock_predict, mock_fit, example_graph, X_y_binary): X, y = X_y_binary - mock_predict.return_value = pd.Series(y) + mock_predict.return_value = ww.DataColumn(pd.Series(y)) component_graph = ComponentGraph(example_graph).instantiate({}) component_graph.fit(X, y) @@ -431,7 +431,7 @@ def test_predict(mock_predict, mock_fit, example_graph, X_y_binary): @patch('evalml.pipelines.components.Estimator.predict') def test_predict_repeat_estimator(mock_predict, mock_fit, X_y_binary): X, y = X_y_binary - mock_predict.return_value = pd.Series(y) + mock_predict.return_value = ww.DataColumn(pd.Series(y)) graph = {'Imputer': [Imputer], 'OneHot_RandomForest': [OneHotEncoder, 'Imputer.x'], @@ -476,10 +476,10 @@ def test_compute_final_component_features_linear(mock_ohe, mock_imputer, X_y_bin @patch('evalml.pipelines.components.ElasticNetClassifier.predict') def test_compute_final_component_features_nonlinear(mock_en_predict, mock_rf_predict, mock_ohe, mock_imputer, example_graph, X_y_binary): X, y = X_y_binary - mock_imputer.return_value = pd.DataFrame(X) - mock_ohe.return_value = pd.DataFrame(X) - mock_en_predict.return_value = pd.Series(np.ones(X.shape[0])) - mock_rf_predict.return_value = pd.Series(np.zeros(X.shape[0])) + mock_imputer.return_value = ww.DataTable(pd.DataFrame(X)) + mock_ohe.return_value = ww.DataTable(pd.DataFrame(X)) + mock_en_predict.return_value = ww.DataColumn(pd.Series(np.ones(X.shape[0]))) + mock_rf_predict.return_value = ww.DataColumn(pd.Series(np.zeros(X.shape[0]))) X_expected = pd.DataFrame({'Random Forest': np.zeros(X.shape[0]), 'Elastic Net': np.ones(X.shape[0])}) component_graph = ComponentGraph(example_graph).instantiate({}) component_graph.fit(X, y) From 5430ebc46845f5f7903d400612b501bf4d3e37be Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 14 Jan 2021 21:20:14 -0500 Subject: [PATCH 43/98] update component graph to handle naming --- evalml/pipelines/component_graph.py | 28 ++++++++++++++++++---------- 1 file changed, 18 insertions(+), 10 deletions(-) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 571aa16529..2d9fe1d1f2 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -196,6 +196,7 @@ def _compute_features(self, component_list, X, y=None, fit=False): raise ValueError('All components must be instantiated before fitting or predicting') x_inputs = [] y_input = None + merged_types_dict = {} for parent_input in self.get_parents(component_name): if parent_input[-2:] == '.y': if y_input is not None: @@ -210,6 +211,12 @@ def _compute_features(self, component_list, X, y=None, fit=False): # parent_x_series = parent_x.to_series() # parent_x = pd.DataFrame(parent_x_series, columns=[parent_input]) # parent_x = _convert_to_woodwork_structure(parent_x).to_dataframe() + if isinstance(parent_x, ww.DataTable): + merged_types_dict.update(parent_x.logical_types) + parent_x = parent_x.to_dataframe() + elif isinstance(parent_x, ww.DataColumn): 
+ # following what was previously here, but could probs be simplified. + parent_x = pd.DataFrame(parent_x.to_series(), columns=[parent_input]) x_inputs.append(parent_x) input_x, input_y = self._consolidate_inputs(x_inputs, y_input, X, y) # check for original types and make sure they're preserved... @@ -285,16 +292,17 @@ def _consolidate_inputs(x_inputs, y_input, X, y): if len(x_inputs) == 0: return_x = X else: - x_to_concat = [] - for x_in in x_inputs: - if isinstance(x_in, ww.DataTable): - merged_types_dict.update(x_in.logical_types) - x_to_concat.append(x_in.to_dataframe()) - elif isinstance(x_in, ww.DataColumn): - x_to_concat.append(x_in.to_series()) - else: # shouldnt reach here. - x_to_concat.append(x_in) - return_x = pd.concat(x_to_concat, axis=1) + # x_to_concat = [] + # for x_in in x_inputs: + # if isinstance(x_in, ww.DataTable): + # merged_types_dict.update(x_in.logical_types) + # x_to_concat.append(x_in.to_dataframe()) + # elif isinstance(x_in, ww.DataColumn): + # # following what was previously here, but could probs be simplified. + # x_to_concat.append(pd.DataFrame(x_in.to_series(), columns=[parent_input])) + # else: # shouldnt reach here. + # x_to_concat.append(x_in) + return_x = pd.concat(x_inputs, axis=1) return_y = y if y_input is not None: return_y = y_input From 16f58a9eccbcca52a43fc5ef7a24dfdeef0394ad Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 14 Jan 2021 21:53:48 -0500 Subject: [PATCH 44/98] fix docs --- evalml/utils/gen_utils.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/evalml/utils/gen_utils.py b/evalml/utils/gen_utils.py index 8e54c5ff84..dc103218c5 100644 --- a/evalml/utils/gen_utils.py +++ b/evalml/utils/gen_utils.py @@ -358,7 +358,7 @@ def _convert_woodwork_types_wrapper(pd_data): def pad_with_nans(pd_data, num_to_pad): """Pad the beginning num_to_pad rows with nans. - TODO + Arguments: pd_data (pd.DataFrame or pd.Series): Data to pad. 
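A pattern keeps recurring in the component-graph hunks above: normalize every parent output to pandas for the concat while recording its woodwork logical types, then re-apply those types afterwards. The standalone sketch below distills that pattern. It is not evalml's actual helper; it assumes the pre-0.1 woodwork DataTable/DataColumn API already used on this branch, and unique column names across parents.

import pandas as pd
import woodwork as ww

def consolidate(parent_outputs):
    """parent_outputs: dict mapping a parent component's name to its output."""
    merged_types = {}
    frames = []
    for name, out in parent_outputs.items():
        if isinstance(out, ww.DataTable):
            # remember each column's logical type before dropping to pandas
            merged_types.update(out.logical_types)
            frames.append(out.to_dataframe())
        elif isinstance(out, ww.DataColumn):
            # single-column outputs (e.g. estimator predictions) take the
            # name of the parent component that produced them
            frames.append(out.to_series().rename(name).to_frame())
        else:
            frames.append(out)  # plain pandas passes through untouched
    combined = ww.DataTable(pd.concat(frames, axis=1))
    # set_types returns a new DataTable with the recorded types restored
    return combined.set_types(merged_types)

Called as consolidate({'Imputer.x': imputed_table, 'Random Forest': predictions_column}), it yields a single typed DataTable ready for the child component.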
From b241e39767a6a417b7c2618c853df20520db2895 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 15 Jan 2021 10:04:10 -0500 Subject: [PATCH 45/98] uncomment test --- .../tests/component_tests/test_target_encoder.py | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/evalml/tests/component_tests/test_target_encoder.py b/evalml/tests/component_tests/test_target_encoder.py index 5d7dc5a788..c20d9d9f64 100644 --- a/evalml/tests/component_tests/test_target_encoder.py +++ b/evalml/tests/component_tests/test_target_encoder.py @@ -50,14 +50,14 @@ def test_null_values_in_dataframe(): 'col_2': ["a", "b", "a", "c", "b"], 'col_3': ["a", "a", "a", "a", "a"]}) y = pd.Series([0, 1, 1, 1, 0]) - # encoder = TargetEncoder(handle_missing='value') - # encoder.fit(X, y) - # X_t = encoder.transform(X) - # X_expected = pd.DataFrame({'col_1': [0.6, 0.6, 0.6, 0.6, 0.6], - # 'col_2': [0.526894, 0.526894, 0.526894, 0.6, 0.526894], - # 'col_3': [0.6, 0.6, 0.6, 0.6, 0.6, ]}) - - # assert_frame_equal(X_expected, X_t.to_dataframe()) + encoder = TargetEncoder(handle_missing='value') + encoder.fit(X, y) + X_t = encoder.transform(X) + X_expected = pd.DataFrame({'col_1': [0.6, 0.6, 0.6, 0.6, 0.6], + 'col_2': [0.526894, 0.526894, 0.526894, 0.6, 0.526894], + 'col_3': [0.6, 0.6, 0.6, 0.6, 0.6, ]}) + + assert_frame_equal(X_expected, X_t.to_dataframe()) encoder = TargetEncoder(handle_missing='return_nan') encoder.fit(X, y) From 12c30aea49858e2fe0ef5a19d0f9afd4f132683d Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 15 Jan 2021 10:57:05 -0500 Subject: [PATCH 46/98] fix pipelines docs --- docs/source/user_guide/pipelines.ipynb | 20 ++++++++++++-------- 1 file changed, 12 insertions(+), 8 deletions(-) diff --git a/docs/source/user_guide/pipelines.ipynb b/docs/source/user_guide/pipelines.ipynb index 1eca6460c1..89d245cc72 100644 --- a/docs/source/user_guide/pipelines.ipynb +++ b/docs/source/user_guide/pipelines.ipynb @@ -357,12 +357,15 @@ { "cell_type": "code", "execution_count": null, - "metadata": {}, + "metadata": { + "scrolled": false + }, "outputs": [], "source": [ "from evalml.pipelines.utils import generate_pipeline_code\n", "from evalml.pipelines import MulticlassClassificationPipeline\n", "import pandas as pd\n", + "from evalml.utils import _convert_to_woodwork_structure, _convert_woodwork_types_wrapper\n", "\n", "class MyDropNullColumns(Transformer):\n", " \"\"\"Transformer to drop features whose percentage of NaN values exceeds a specified threshold\"\"\"\n", @@ -389,8 +392,8 @@ "\n", " def fit(self, X, y=None):\n", " pct_null_threshold = self.parameters[\"pct_null_threshold\"]\n", - " if not isinstance(X, pd.DataFrame):\n", - " X = pd.DataFrame(X)\n", + " X = _convert_to_woodwork_structure(X)\n", + " X = _convert_woodwork_types_wrapper(X.to_dataframe())\n", " percent_null = X.isnull().mean()\n", " if pct_null_threshold == 0.0:\n", " null_cols = percent_null[percent_null > 0]\n", @@ -408,9 +411,10 @@ " pd.DataFrame: Transformed X\n", " \"\"\"\n", "\n", - " if not isinstance(X, pd.DataFrame):\n", - " X = pd.DataFrame(X)\n", - " return X.drop(columns=self._cols_to_drop, axis=1)\n", + " X = _convert_to_woodwork_structure(X)\n", + " X = _convert_woodwork_types_wrapper(X.to_dataframe())\n", + " X_t = X.drop(columns=self._cols_to_drop, axis=1)\n", + " return _convert_to_woodwork_structure(X_t)\n", "\n", "class CustomPipeline(MulticlassClassificationPipeline):\n", " name = \"Custom Pipeline\"\n", @@ -451,9 +455,9 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": 
"ipython3", - "version": "3.8.6" + "version": "3.7.5" } }, "nbformat": 4, "nbformat_minor": 4 -} \ No newline at end of file +} From 2d4a0e69a229108cb418402f056cd36ecd452511 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 15 Jan 2021 12:18:43 -0500 Subject: [PATCH 47/98] mini cleanup here --- evalml/pipelines/component_graph.py | 45 +------------------ .../time_series_baseline_estimator.py | 8 ++-- .../test_time_series_baseline_pipeline.py | 16 +++---- 3 files changed, 14 insertions(+), 55 deletions(-) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 2d9fe1d1f2..60e6c56c59 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -204,13 +204,6 @@ def _compute_features(self, component_list, X, y=None, fit=False): y_input = output_cache[parent_input] else: parent_x = output_cache.get(parent_input, output_cache.get(f'{parent_input}.x')) - # ideally, we want this to be woodwork stuff that's outputted and concatted. - # if isinstance(parent_x, pd.Series): - # parent_x = pd.DataFrame(parent_x, columns=[parent_input]) - # if isinstance(parent_x, ww.DataColumn): - # parent_x_series = parent_x.to_series() - # parent_x = pd.DataFrame(parent_x_series, columns=[parent_input]) - # parent_x = _convert_to_woodwork_structure(parent_x).to_dataframe() if isinstance(parent_x, ww.DataTable): merged_types_dict.update(parent_x.logical_types) parent_x = parent_x.to_dataframe() @@ -219,12 +212,8 @@ def _compute_features(self, component_list, X, y=None, fit=False): parent_x = pd.DataFrame(parent_x.to_series(), columns=[parent_input]) x_inputs.append(parent_x) input_x, input_y = self._consolidate_inputs(x_inputs, y_input, X, y) - # check for original types and make sure they're preserved... - # import pdb; pdb.set_trace() - # for t in original_logical_types: - # if t in input_x.columns: - # input_x = input_x.set_types({t: original_logical_types[t]}) for t in original_logical_types: + # numeric is special(ints, floats. ex: targetencoder.) 
if t in input_x.columns and "numeric" not in input_x[t].semantic_tags: input_x = input_x.set_types({t: original_logical_types[t]}) self.input_feature_names.update({component_name: list(input_x.columns)}) @@ -251,28 +240,6 @@ def _compute_features(self, component_list, X, y=None, fit=False): output_cache[component_name] = output return output_cache - # @staticmethod - # def _consolidate_inputs(x_inputs, y_input, X, y): - # """ Combines any/all X and y inputs for a component, including handling defaults - - # Arguments: - # x_inputs (list(pd.DataFrame)): Data to be used as X input for a component - # y_input (pd.Series, None): If present, the Series to use as y input for a component, different from the original y - # X (pd.DataFrame): The original X input, to be used if there is no parent X input - # y (pd.Series): The original y input, to be used if there is no parent y input - - # Returns: - # pd.DataFrame, pd.Series: The X and y transformed values to evaluate a component with - # """ - - # if len(x_inputs) == 0: - # return_x = X - # else: - # return_x = pd.concat([x_in.to_dataframe() if isinstance(x_in, ww.DataTable) else x_in for x_in in x_inputs], axis=1) - # return_y = y - # if y_input is not None: - # return_y = y_input - # return return_x, return_y @staticmethod def _consolidate_inputs(x_inputs, y_input, X, y): @@ -292,16 +259,6 @@ def _consolidate_inputs(x_inputs, y_input, X, y): if len(x_inputs) == 0: return_x = X else: - # x_to_concat = [] - # for x_in in x_inputs: - # if isinstance(x_in, ww.DataTable): - # merged_types_dict.update(x_in.logical_types) - # x_to_concat.append(x_in.to_dataframe()) - # elif isinstance(x_in, ww.DataColumn): - # # following what was previously here, but could probs be simplified. - # x_to_concat.append(pd.DataFrame(x_in.to_series(), columns=[parent_input])) - # else: # shouldnt reach here. - # x_to_concat.append(x_in) return_x = pd.concat(x_inputs, axis=1) return_y = y if y_input is not None: diff --git a/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py b/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py index 74b12ed986..c087a5d95f 100644 --- a/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py +++ b/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py @@ -57,12 +57,13 @@ def fit(self, X, y=None): def predict(self, X, y=None): if y is None: raise ValueError("Cannot predict Time Series Baseline Estimator if y is None") + # TODO indices issue here? 
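# (annotation, not part of the patch: with gap == 0 the baseline predicts each
# target's previous value, hence the shift below; y = [2, 5, 9] yields
# predictions [NaN, 2, 5]. For gap >= 1 the incoming y is already lagged by
# the pipeline and is returned as-is. The TODO presumably flags that the
# shifted series keeps y's original index, which callers should not assume
# lines up with X.)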
y = _convert_to_woodwork_structure(y) y = _convert_woodwork_types_wrapper(y.to_series()) if self.gap == 0: y = y.shift(periods=1) - + return _convert_to_woodwork_structure(y) def predict_proba(self, X, y=None): @@ -70,10 +71,11 @@ def predict_proba(self, X, y=None): raise ValueError("Cannot predict Time Series Baseline Estimator if y is None") y = _convert_to_woodwork_structure(y) y = _convert_woodwork_types_wrapper(y.to_series()) - preds = self.predict(X, y).dropna(axis=0, how='any').astype('int') + preds = self.predict(X, y).to_series().dropna(axis=0, how='any').astype('int') proba_arr = np.zeros((len(preds), y.max() + 1)) proba_arr[np.arange(len(preds)), preds] = 1 - return pad_with_nans(pd.DataFrame(proba_arr), len(y) - len(preds)) + padded = pad_with_nans(pd.DataFrame(proba_arr), len(y) - len(preds)) + return _convert_to_woodwork_structure(padded) @property def feature_importance(self): diff --git a/evalml/tests/pipeline_tests/test_time_series_baseline_pipeline.py b/evalml/tests/pipeline_tests/test_time_series_baseline_pipeline.py index 41f1f5f3c2..e58892a6f3 100644 --- a/evalml/tests/pipeline_tests/test_time_series_baseline_pipeline.py +++ b/evalml/tests/pipeline_tests/test_time_series_baseline_pipeline.py @@ -9,7 +9,7 @@ TimeSeriesBaselineBinaryPipeline, TimeSeriesBaselineMulticlassPipeline ) - +from pandas.testing import assert_series_equal, assert_frame_equal @pytest.mark.parametrize('X_none', [True, False]) @pytest.mark.parametrize('gap', [0, 1]) @@ -24,7 +24,7 @@ def test_time_series_baseline(pipeline_class, gap, X_none, ts_data): if X_none: X = None clf.fit(X, y) - np.testing.assert_allclose(clf.predict(X, y), expected_y) + assert_series_equal(expected_y, clf.predict(X, y).to_series()) @pytest.mark.parametrize('X_none', [True, False]) @@ -33,13 +33,13 @@ def test_time_series_baseline(pipeline_class, gap, X_none, ts_data): def test_time_series_baseline_predict_proba(pipeline_class, gap, X_none): X = pd.DataFrame({"a": [4, 5, 6, 7, 8]}) y = pd.Series([0, 1, 1, 0, 1]) - expected_proba = pd.DataFrame({0: [1, 0, 0, 1, 0], - 1: [0, 1, 1, 0, 1]}) + expected_proba = pd.DataFrame({0: pd.Series([1, 0, 0, 1, 0], dtype="float64"), + 1: pd.Series([0, 1, 1, 0, 1], dtype="float64")}) if pipeline_class == TimeSeriesBaselineMulticlassPipeline: y = pd.Series([0, 1, 2, 2, 1]) - expected_proba = pd.DataFrame({0: [1, 0, 0, 0, 0], - 1: [0, 1, 0, 0, 1], - 2: [0, 0, 1, 1, 0]}) + expected_proba = pd.DataFrame({0: pd.Series([1, 0, 0, 0, 0], dtype="float64"), + 1: pd.Series([0, 1, 0, 0, 1], dtype="float64"), + 2: pd.Series([0, 0, 1, 1, 0], dtype="float64")}) if gap == 0: # Shift to pad the first row with Nans expected_proba = expected_proba.shift(1) @@ -49,7 +49,7 @@ def test_time_series_baseline_predict_proba(pipeline_class, gap, X_none): if X_none: X = None clf.fit(X, y) - np.testing.assert_allclose(clf.predict_proba(X, y), expected_proba) + assert_frame_equal(expected_proba, clf.predict_proba(X, y).to_dataframe()) @pytest.mark.parametrize('pipeline_class', [TimeSeriesBaselineRegressionPipeline, From b90f9156f6a45c5eea9251dbcb196a35396e716d Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 15 Jan 2021 15:56:36 -0500 Subject: [PATCH 48/98] fix tests --- docs/source/user_guide/pipelines.ipynb | 4 +- evalml/pipelines/component_graph.py | 5 +-- .../time_series_baseline_estimator.py | 2 +- .../time_series_classification_pipelines.py | 2 - .../pipeline_tests/test_component_graph.py | 42 ++++++++++++------- .../test_time_series_baseline_pipeline.py | 3 +- 6 files changed, 34 insertions(+), 24 deletions(-) 
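The test fixes below follow one recipe: mocks hand back woodwork structures, and assertions unwrap them with to_dataframe() or to_series() and expect woodwork's nullable dtypes. A minimal sketch of that recipe, with an illustrative component stubbed out since the real ones live elsewhere in the codebase:

import pandas as pd
import woodwork as ww
from pandas.testing import assert_frame_equal

def test_component_output_is_woodwork():
    X = pd.DataFrame({"a": [1, 2, 3]})
    out = ww.DataTable(X)  # stand-in for SomeComponent().fit_transform(X, y)
    assert isinstance(out, ww.DataTable)
    # woodwork stores integers as pandas' nullable Int64, so the expected
    # frame must be built with that dtype before comparing
    expected = pd.DataFrame({"a": pd.Series([1, 2, 3], dtype="Int64")})
    assert_frame_equal(expected, out.to_dataframe())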
diff --git a/docs/source/user_guide/pipelines.ipynb b/docs/source/user_guide/pipelines.ipynb index 89d245cc72..dc87764e83 100644 --- a/docs/source/user_guide/pipelines.ipynb +++ b/docs/source/user_guide/pipelines.ipynb @@ -455,9 +455,9 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.7.5" + "version": "3.8.6" } }, "nbformat": 4, "nbformat_minor": 4 -} +} \ No newline at end of file diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 60e6c56c59..62159bc7a1 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -206,10 +206,10 @@ def _compute_features(self, component_list, X, y=None, fit=False): parent_x = output_cache.get(parent_input, output_cache.get(f'{parent_input}.x')) if isinstance(parent_x, ww.DataTable): merged_types_dict.update(parent_x.logical_types) - parent_x = parent_x.to_dataframe() + parent_x = _convert_woodwork_types_wrapper(parent_x.to_dataframe()) elif isinstance(parent_x, ww.DataColumn): # following what was previously here, but could probs be simplified. - parent_x = pd.DataFrame(parent_x.to_series(), columns=[parent_input]) + parent_x = pd.DataFrame(_convert_woodwork_types_wrapper(parent_x.to_series()), columns=[parent_input]) x_inputs.append(parent_x) input_x, input_y = self._consolidate_inputs(x_inputs, y_input, X, y) for t in original_logical_types: @@ -240,7 +240,6 @@ def _compute_features(self, component_list, X, y=None, fit=False): output_cache[component_name] = output return output_cache - @staticmethod def _consolidate_inputs(x_inputs, y_input, X, y): """ Combines any/all X and y inputs for a component, including handling defaults diff --git a/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py b/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py index c087a5d95f..e6221ed814 100644 --- a/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py +++ b/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py @@ -63,7 +63,7 @@ def predict(self, X, y=None): if self.gap == 0: y = y.shift(periods=1) - + return _convert_to_woodwork_structure(y) def predict_proba(self, X, y=None): diff --git a/evalml/pipelines/time_series_classification_pipelines.py b/evalml/pipelines/time_series_classification_pipelines.py index d6cbb2890e..9be27e10c3 100644 --- a/evalml/pipelines/time_series_classification_pipelines.py +++ b/evalml/pipelines/time_series_classification_pipelines.py @@ -131,8 +131,6 @@ def predict(self, X, y=None, objective=None): padded = pad_with_nans(predictions, max(0, n_features - predictions.shape[0])) return _convert_to_woodwork_structure(padded) - - def predict_proba(self, X, y=None): """Make probability estimates for labels. 
diff --git a/evalml/tests/pipeline_tests/test_component_graph.py b/evalml/tests/pipeline_tests/test_component_graph.py index 8e66ee7176..885e78330a 100644 --- a/evalml/tests/pipeline_tests/test_component_graph.py +++ b/evalml/tests/pipeline_tests/test_component_graph.py @@ -368,9 +368,9 @@ def test_fit_correct_inputs(mock_ohe_transform, mock_imputer_fit_transform, X_y_ mock_ohe_transform.return_value = expected_x component_graph = ComponentGraph(graph).instantiate({}) component_graph.fit(X, y) - ### TODO - assert_frame_equal(mock_ohe_transform.call_args[0][0], expected_x.to_dataframe()) - assert_series_equal(mock_ohe_transform.call_args[0][1].to_series(), expected_y.to_series()) + + assert_frame_equal(expected_x.to_dataframe(), mock_ohe_transform.call_args[0][0].to_dataframe()) + assert_series_equal(expected_y.to_series(), mock_ohe_transform.call_args[0][1].to_series()) @patch('evalml.pipelines.components.Transformer.fit_transform') @@ -603,12 +603,12 @@ def test_computation_input_custom_index(index): @patch(f'{__name__}.TransformerA.transform') def test_component_graph_evaluation_plumbing(mock_transa, mock_transb, mock_transc, mock_preda, mock_predb, mock_predc, dummy_components): TransformerA, TransformerB, TransformerC, EstimatorA, EstimatorB, EstimatorC = dummy_components - mock_transa.return_value = pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6)}) - mock_transb.return_value = pd.DataFrame({'feature b': np.ones(6) * 2}) - mock_transc.return_value = pd.DataFrame({'feature c': np.ones(6) * 3}) - mock_preda.return_value = pd.Series([0, 0, 0, 1, 0, 0]) - mock_predb.return_value = pd.Series([0, 0, 0, 0, 1, 0]) - mock_predc.return_value = pd.Series([0, 0, 0, 0, 0, 1]) + mock_transa.return_value = ww.DataTable(pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6)})) + mock_transb.return_value = ww.DataTable(pd.DataFrame({'feature b': np.ones(6) * 2})) + mock_transc.return_value = ww.DataTable(pd.DataFrame({'feature c': np.ones(6) * 3})) + mock_preda.return_value = ww.DataColumn(pd.Series([0, 0, 0, 1, 0, 0])) + mock_predb.return_value = ww.DataColumn(pd.Series([0, 0, 0, 0, 1, 0])) + mock_predc.return_value = ww.DataColumn(pd.Series([0, 0, 0, 0, 0, 1])) graph = { 'transformer a': [TransformerA], 'transformer b': [TransformerB, 'transformer a'], @@ -624,12 +624,24 @@ def test_component_graph_evaluation_plumbing(mock_transa, mock_transb, mock_tran component_graph.fit(X, y) predict_out = component_graph.predict(X) - assert_frame_equal(mock_transa.call_args[0][0], X) - assert_frame_equal(mock_transb.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6)}, columns=['feature trans', 'feature a'])) - assert_frame_equal(mock_transc.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6), 'feature b': np.ones(6) * 2}, columns=['feature trans', 'feature a', 'feature b'])) - assert_frame_equal(mock_preda.call_args[0][0], X) - assert_frame_equal(mock_predb.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6)}, columns=['feature trans', 'feature a'])) - assert_frame_equal(mock_predc.call_args[0][0], pd.DataFrame({'feature trans': [1, 0, 0, 0, 0, 0], 'feature a': np.ones(6), 'estimator a': [0, 0, 0, 1, 0, 0], 'feature b': np.ones(6) * 2, 'estimator b': [0, 0, 0, 0, 1, 0], 'feature c': np.ones(6) * 3}, columns=['feature trans', 'feature a', 'estimator a', 'feature b', 'estimator b', 'feature c'])) + 
assert_frame_equal(mock_transa.call_args[0][0].to_dataframe(), X) + assert_frame_equal(mock_transb.call_args[0][0].to_dataframe(), pd.DataFrame({'feature trans': pd.Series([1, 0, 0, 0, 0, 0], dtype="Int64"), + 'feature a': np.ones(6)}, columns=['feature trans', 'feature a'])) + assert_frame_equal(mock_transc.call_args[0][0].to_dataframe(), pd.DataFrame({'feature trans': pd.Series([1, 0, 0, 0, 0, 0], dtype="Int64"), + 'feature a': np.ones(6), + 'feature b': np.ones(6) * 2}, + columns=['feature trans', 'feature a', 'feature b'])) + assert_frame_equal(mock_preda.call_args[0][0].to_dataframe(), X) + assert_frame_equal(mock_predb.call_args[0][0].to_dataframe(), pd.DataFrame({'feature trans': pd.Series([1, 0, 0, 0, 0, 0], dtype="Int64"), + 'feature a': np.ones(6)}, + columns=['feature trans', 'feature a'])) + assert_frame_equal(mock_predc.call_args[0][0].to_dataframe(), pd.DataFrame({'feature trans': pd.Series([1, 0, 0, 0, 0, 0], dtype="Int64"), + 'feature a': np.ones(6), + 'estimator a': pd.Series([0, 0, 0, 1, 0, 0], dtype="Int64"), + 'feature b': np.ones(6) * 2, + 'estimator b': pd.Series([0, 0, 0, 0, 1, 0], dtype="Int64"), + 'feature c': np.ones(6) * 3}, + columns=['feature trans', 'feature a', 'estimator a', 'feature b', 'estimator b', 'feature c'])) assert_series_equal(pd.Series([0, 0, 0, 0, 0, 1], dtype="Int64"), predict_out.to_series()) diff --git a/evalml/tests/pipeline_tests/test_time_series_baseline_pipeline.py b/evalml/tests/pipeline_tests/test_time_series_baseline_pipeline.py index e58892a6f3..3e568dc699 100644 --- a/evalml/tests/pipeline_tests/test_time_series_baseline_pipeline.py +++ b/evalml/tests/pipeline_tests/test_time_series_baseline_pipeline.py @@ -3,13 +3,14 @@ import numpy as np import pandas as pd import pytest +from pandas.testing import assert_frame_equal, assert_series_equal from evalml.pipelines import TimeSeriesBaselineRegressionPipeline from evalml.pipelines.time_series_baselines import ( TimeSeriesBaselineBinaryPipeline, TimeSeriesBaselineMulticlassPipeline ) -from pandas.testing import assert_series_equal, assert_frame_equal + @pytest.mark.parametrize('X_none', [True, False]) @pytest.mark.parametrize('gap', [0, 1]) From 03662c68c7e75c4cca4d098f5c87908ad1736c23 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 15 Jan 2021 16:14:57 -0500 Subject: [PATCH 49/98] a bit of cleanup --- docs/source/release_notes.rst | 2 +- docs/source/user_guide/pipelines.ipynb | 4 +--- evalml/model_understanding/graphs.py | 1 + .../prediction_explanations/explainers.py | 6 ++---- evalml/objectives/objective_base.py | 1 - evalml/pipelines/classification_pipeline.py | 3 --- evalml/pipelines/component_graph.py | 1 - .../components/estimators/regressors/xgboost_regressor.py | 2 +- .../components/transformers/scalers/standard_scaler.py | 1 - 9 files changed, 6 insertions(+), 15 deletions(-) diff --git a/docs/source/release_notes.rst b/docs/source/release_notes.rst index e5e68b4267..c32a84b12c 100644 --- a/docs/source/release_notes.rst +++ b/docs/source/release_notes.rst @@ -42,7 +42,7 @@ Release Notes **Breaking Changes** * Removed ``has_searched`` property from ``AutoMLSearch`` :pr:`1647` - * Components and pipelines return ``Woodwork`` data structures instead of pandas data structures :pr:`1668` + * Components and pipelines return ``Woodwork`` data structures instead of ``pandas`` data structures :pr:`1668` **v0.17.0 Dec. 
29, 2020** * Enhancements diff --git a/docs/source/user_guide/pipelines.ipynb b/docs/source/user_guide/pipelines.ipynb index dc87764e83..cc48817c3c 100644 --- a/docs/source/user_guide/pipelines.ipynb +++ b/docs/source/user_guide/pipelines.ipynb @@ -357,9 +357,7 @@ { "cell_type": "code", "execution_count": null, - "metadata": { - "scrolled": false - }, + "metadata": {}, "outputs": [], "source": [ "from evalml.pipelines.utils import generate_pipeline_code\n", diff --git a/evalml/model_understanding/graphs.py b/evalml/model_understanding/graphs.py index 251d3db52f..5ea3a8fd3d 100644 --- a/evalml/model_understanding/graphs.py +++ b/evalml/model_understanding/graphs.py @@ -465,6 +465,7 @@ def partial_dependence(pipeline, X, feature, grid_resolution=100): if ((isinstance(feature, int) and X.iloc[:, feature].isnull().sum()) or (isinstance(feature, str) and X[feature].isnull().sum())): warnings.warn("There are null values in the features, which will cause NaN values in the partial dependence output. Fill in these values to remove the NaN values.", NullsInColumnWarning) + wrapped = scikit_learn_wrapped_estimator(pipeline) if isinstance(pipeline, evalml.pipelines.ClassificationPipeline): wrapped._estimator_type = "classifier" diff --git a/evalml/model_understanding/prediction_explanations/explainers.py b/evalml/model_understanding/prediction_explanations/explainers.py index 4d1e3850d3..816f9bb86b 100644 --- a/evalml/model_understanding/prediction_explanations/explainers.py +++ b/evalml/model_understanding/prediction_explanations/explainers.py @@ -173,13 +173,11 @@ def explain_predictions_best_worst(pipeline, input_features, y_true, num_to_expl try: if pipeline.problem_type == ProblemTypes.REGRESSION: - y_pred = pipeline.predict(input_features) - y_pred = y_pred.to_series() + y_pred = pipeline.predict(input_features).to_series() y_pred_values = None errors = metric(y_true, y_pred) else: - y_pred = pipeline.predict_proba(input_features) - y_pred = y_pred.to_dataframe() + y_pred = pipeline.predict_proba(input_features).to_dataframe() y_pred_values = pipeline.predict(input_features) y_pred_values = y_pred_values.to_series() errors = metric(pipeline._encode_targets(y_true), y_pred) diff --git a/evalml/objectives/objective_base.py b/evalml/objectives/objective_base.py index ec0d634e08..4d004676b7 100644 --- a/evalml/objectives/objective_base.py +++ b/evalml/objectives/objective_base.py @@ -114,7 +114,6 @@ def validate_inputs(self, y_true, y_predicted): raise ValueError("y_true contains NaN or infinity") # y_predicted could be a 1d vector (predictions) or a 2d vector (classifier predicted probabilities) y_pred_flat = y_predicted.to_numpy().flatten() - if np.isnan(y_pred_flat).any() or np.isinf(y_pred_flat).any(): raise ValueError("y_predicted contains NaN or infinity") if self.score_needs_proba and np.any([(y_pred_flat < 0) | (y_pred_flat > 1)]): diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index ee2352e897..eadeddc1e9 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -39,7 +39,6 @@ def fit(self, X, y): self """ - # import pdb; pdb.set_trace() X = _convert_to_woodwork_structure(X) y = _convert_to_woodwork_structure(y) y = _convert_woodwork_types_wrapper(y.to_series()) @@ -80,7 +79,6 @@ def _predict(self, X, objective=None): pd.Series: Estimated labels """ # why does this not use objectives... because multiclass doesnt? 
so maybe this should be moved for less confusion - # import pdb; pdb.set_trace() return self._component_graph.predict(X) def predict(self, X, objective=None): @@ -93,7 +91,6 @@ def predict(self, X, objective=None): Returns: pd.Series : Estimated labels """ - # import pdb; pdb.set_trace() predictions = self._predict(X, objective) predictions = predictions.to_series() predictions = pd.Series(self._decode_targets(predictions), name=self.input_target_name) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 62159bc7a1..ee6434d151 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -91,7 +91,6 @@ def fit(self, X, y): X (pd.DataFrame): The input training data of shape [n_samples, n_features] y (pd.Series): The target training data of length [n_samples] """ - # import pdb; pdb.set_trace() self._compute_features(self.compute_order, X, y, fit=True) return self diff --git a/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py b/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py index f354bf7bcc..8b7a26da8a 100644 --- a/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py +++ b/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py @@ -50,7 +50,7 @@ def fit(self, X, y=None): def predict(self, X): X = _rename_column_names_to_numeric(X) predictions = super().predict(X) - predictions = _convert_to_woodwork_structure(predictions) + predictions = _convert_to_woodwork_structure(predictions) # UNNECESSARY? return predictions @property diff --git a/evalml/pipelines/components/transformers/scalers/standard_scaler.py b/evalml/pipelines/components/transformers/scalers/standard_scaler.py index b5d7709c1d..b4f1a364dd 100644 --- a/evalml/pipelines/components/transformers/scalers/standard_scaler.py +++ b/evalml/pipelines/components/transformers/scalers/standard_scaler.py @@ -30,7 +30,6 @@ def transform(self, X, y=None): X_index = X.index X_t = self._component_obj.transform(X) X_t_df = pd.DataFrame(X_t, columns=X_cols, index=X_index) - # import pdb; pdb.set_trace() return _convert_to_woodwork_structure(X_t_df) def fit_transform(self, X, y=None): From 4425ad7086c97c6f649457982ff6ca038716893d Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 15 Jan 2021 17:43:04 -0500 Subject: [PATCH 50/98] fix tests --- evalml/tests/pipeline_tests/test_component_graph.py | 2 +- .../pipeline_tests/test_time_series_baseline_pipeline.py | 5 ++--- 2 files changed, 3 insertions(+), 4 deletions(-) diff --git a/evalml/tests/pipeline_tests/test_component_graph.py b/evalml/tests/pipeline_tests/test_component_graph.py index 885e78330a..ef74fd2d08 100644 --- a/evalml/tests/pipeline_tests/test_component_graph.py +++ b/evalml/tests/pipeline_tests/test_component_graph.py @@ -455,7 +455,7 @@ def test_predict_repeat_estimator(mock_predict, mock_fit, X_y_binary): def test_compute_final_component_features_linear(mock_ohe, mock_imputer, X_y_binary): X, y = X_y_binary X = pd.DataFrame(X) - X_expected = pd.DataFrame(index=X.index, columns=X.columns).fillna(0) + X_expected = X.fillna(0) mock_imputer.return_value = ww.DataTable(X) mock_ohe.return_value = ww.DataTable(X_expected) diff --git a/evalml/tests/pipeline_tests/test_time_series_baseline_pipeline.py b/evalml/tests/pipeline_tests/test_time_series_baseline_pipeline.py index 3e568dc699..0a170d4f3b 100644 --- a/evalml/tests/pipeline_tests/test_time_series_baseline_pipeline.py +++ b/evalml/tests/pipeline_tests/test_time_series_baseline_pipeline.py 
@@ -3,7 +3,6 @@ import numpy as np import pandas as pd import pytest -from pandas.testing import assert_frame_equal, assert_series_equal from evalml.pipelines import TimeSeriesBaselineRegressionPipeline from evalml.pipelines.time_series_baselines import ( @@ -25,7 +24,7 @@ def test_time_series_baseline(pipeline_class, gap, X_none, ts_data): if X_none: X = None clf.fit(X, y) - assert_series_equal(expected_y, clf.predict(X, y).to_series()) + np.testing.assert_equal(expected_y.values, clf.predict(X, y).to_series().values) @pytest.mark.parametrize('X_none', [True, False]) @@ -50,7 +49,7 @@ def test_time_series_baseline_predict_proba(pipeline_class, gap, X_none): if X_none: X = None clf.fit(X, y) - assert_frame_equal(expected_proba, clf.predict_proba(X, y).to_dataframe()) + pd.testing.assert_frame_equal(expected_proba, clf.predict_proba(X, y).to_dataframe()) @pytest.mark.parametrize('pipeline_class', [TimeSeriesBaselineRegressionPipeline, From 0295348408aad8dee84df90540c70e9504e0f992 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 15 Jan 2021 18:18:34 -0500 Subject: [PATCH 51/98] remove catboost changes from this branch --- .../components/estimators/classifiers/catboost_classifier.py | 4 ++-- .../components/estimators/regressors/catboost_regressor.py | 4 ++-- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py b/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py index ee3d6d8ddd..752d6f9529 100644 --- a/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py +++ b/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py @@ -70,8 +70,8 @@ def fit(self, X, y=None): if y.nunique() <= 2: self._label_encoder = LabelEncoder() y = pd.Series(self._label_encoder.fit_transform(y)) - self._component_obj.fit(X, y, silent=True, cat_features=cat_cols) - return self + model = self._component_obj.fit(X, y, silent=True, cat_features=cat_cols) + return model def predict(self, X): X = _convert_to_woodwork_structure(X) diff --git a/evalml/pipelines/components/estimators/regressors/catboost_regressor.py b/evalml/pipelines/components/estimators/regressors/catboost_regressor.py index 9ddda1c733..505cff948a 100644 --- a/evalml/pipelines/components/estimators/regressors/catboost_regressor.py +++ b/evalml/pipelines/components/estimators/regressors/catboost_regressor.py @@ -62,8 +62,8 @@ def fit(self, X, y=None): y = _convert_to_woodwork_structure(y) y = _convert_woodwork_types_wrapper(y.to_series()) - self._component_obj.fit(X, y, silent=True, cat_features=cat_cols) - return self + model = self._component_obj.fit(X, y, silent=True, cat_features=cat_cols) + return model @property def feature_importance(self): From 326b55009c214a84a9131159ac39cece30f2d1af Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 15 Jan 2021 18:35:17 -0500 Subject: [PATCH 52/98] cleanup some comments --- evalml/pipelines/component_graph.py | 2 +- evalml/tests/pipeline_tests/test_pipelines.py | 14 +++++++------- 2 files changed, 8 insertions(+), 8 deletions(-) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index ee6434d151..01ae00bb21 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -100,7 +100,7 @@ def fit_features(self, X, y): Arguments: X (pd.DataFrame): The input training data of shape [n_samples, n_features] y (pd.Series): The target training data of length [n_samples] - + Returns: ww.DataTable """ diff --git 
a/evalml/tests/pipeline_tests/test_pipelines.py b/evalml/tests/pipeline_tests/test_pipelines.py index c8d3a5b7ca..63f3668b19 100644 --- a/evalml/tests/pipeline_tests/test_pipelines.py +++ b/evalml/tests/pipeline_tests/test_pipelines.py @@ -1082,17 +1082,17 @@ def test_compute_estimator_features(mock_scaler, mock_ohe, mock_imputer, X_y_bin @patch('evalml.pipelines.components.ElasticNetClassifier.predict') def test_compute_estimator_features_nonlinear(mock_en_predict, mock_rf_predict, mock_ohe, mock_imputer, X_y_binary, nonlinear_binary_pipeline_class): X, y = X_y_binary - ### TODO: can clean - mock_imputer.return_value = ww.DataTable(pd.DataFrame(X)) - mock_ohe.return_value = ww.DataTable(pd.DataFrame(X)) - mock_en_predict.return_value = ww.DataColumn(pd.Series(np.ones(X.shape[0]))) - mock_rf_predict.return_value = ww.DataColumn(pd.Series(np.zeros(X.shape[0]))) - X_expected = pd.DataFrame({'Random Forest': np.zeros(X.shape[0]), 'Elastic Net': np.ones(X.shape[0])}) + mock_imputer.return_value = ww.DataTable(X) + mock_ohe.return_value = ww.DataTable(X) + mock_en_predict.return_value = ww.DataColumn(np.ones(X.shape[0])) + mock_rf_predict.return_value = ww.DataColumn(np.zeros(X.shape[0])) + X_expected_df = pd.DataFrame({'Random Forest': np.zeros(X.shape[0]), 'Elastic Net': np.ones(X.shape[0])}) pipeline = nonlinear_binary_pipeline_class({}) pipeline.fit(X, y) X_t = pipeline.compute_estimator_features(X) - assert_frame_equal(X_expected, X_t.to_dataframe()) + + assert_frame_equal(X_expected_df, X_t.to_dataframe()) assert mock_imputer.call_count == 2 assert mock_ohe.call_count == 4 assert mock_en_predict.call_count == 2 From d6fec28e0c78c6272a81be97a20276a25e4a89dc Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 15 Jan 2021 18:48:17 -0500 Subject: [PATCH 53/98] clean up some estimators --- .../estimators/classifiers/baseline_classifier.py | 7 +------ .../estimators/classifiers/xgboost_classifier.py | 8 ++------ .../estimators/regressors/baseline_regressor.py | 2 -- .../components/estimators/regressors/xgboost_regressor.py | 4 +--- evalml/tests/component_tests/test_xgboost_classifier.py | 1 + 5 files changed, 5 insertions(+), 17 deletions(-) diff --git a/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py b/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py index 5ea99f1953..a8eaa04c3c 100644 --- a/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py +++ b/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py @@ -45,7 +45,6 @@ def fit(self, X, y=None): if y is None: raise ValueError("Cannot fit Baseline classifier if y is None") X = _convert_to_woodwork_structure(X) - X = _convert_woodwork_types_wrapper(X.to_dataframe()) y = _convert_to_woodwork_structure(y) y = _convert_woodwork_types_wrapper(y.to_series()) @@ -61,7 +60,6 @@ def fit(self, X, y=None): def predict(self, X): X = _convert_to_woodwork_structure(X) - X = _convert_woodwork_types_wrapper(X.to_dataframe()) strategy = self.parameters["strategy"] if strategy == "mode": predictions = pd.Series([self._mode] * len(X)) @@ -73,18 +71,15 @@ def predict(self, X): def predict_proba(self, X): X = _convert_to_woodwork_structure(X) - X = _convert_woodwork_types_wrapper(X.to_dataframe()) strategy = self.parameters["strategy"] if strategy == "mode": mode_index = self._classes.index(self._mode) proba_arr = np.array([[1.0 if i == mode_index else 0.0 for i in range(self._num_unique)]] * len(X)) - predictions = pd.DataFrame(proba_arr, columns=self._classes) elif 
strategy == "random": proba_arr = np.array([[1.0 / self._num_unique for i in range(self._num_unique)]] * len(X)) - predictions = pd.DataFrame(proba_arr, columns=self._classes) else: proba_arr = np.array([[self._percentage_freq[i] for i in range(self._num_unique)]] * len(X)) - predictions = pd.DataFrame(proba_arr, columns=self._classes) + predictions = pd.DataFrame(proba_arr, columns=self._classes) return _convert_to_woodwork_structure(predictions) @property diff --git a/evalml/pipelines/components/estimators/classifiers/xgboost_classifier.py b/evalml/pipelines/components/estimators/classifiers/xgboost_classifier.py index e1591c3a09..e3246ac10d 100644 --- a/evalml/pipelines/components/estimators/classifiers/xgboost_classifier.py +++ b/evalml/pipelines/components/estimators/classifiers/xgboost_classifier.py @@ -50,15 +50,11 @@ def fit(self, X, y=None): def predict(self, X): X = _rename_column_names_to_numeric(X) - predictions = super().predict(X) - predictions = _convert_to_woodwork_structure(predictions) - return predictions + return super().predict(X) def predict_proba(self, X): X = _rename_column_names_to_numeric(X) - pred_proba = super().predict_proba(X) - pred_proba = _convert_to_woodwork_structure(pred_proba) - return pred_proba + return super().predict_proba(X) @property def feature_importance(self): diff --git a/evalml/pipelines/components/estimators/regressors/baseline_regressor.py b/evalml/pipelines/components/estimators/regressors/baseline_regressor.py index e0f7984612..2c3b2d9723 100644 --- a/evalml/pipelines/components/estimators/regressors/baseline_regressor.py +++ b/evalml/pipelines/components/estimators/regressors/baseline_regressor.py @@ -43,7 +43,6 @@ def fit(self, X, y=None): if y is None: raise ValueError("Cannot fit Baseline regressor if y is None") X = _convert_to_woodwork_structure(X) - X = _convert_woodwork_types_wrapper(X.to_dataframe()) y = _convert_to_woodwork_structure(y) y = _convert_woodwork_types_wrapper(y.to_series()) @@ -56,7 +55,6 @@ def fit(self, X, y=None): def predict(self, X): X = _convert_to_woodwork_structure(X) - X = _convert_woodwork_types_wrapper(X.to_dataframe()) predictions = pd.Series([self._prediction_value] * len(X)) return _convert_to_woodwork_structure(predictions) diff --git a/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py b/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py index 8b7a26da8a..5660bf4f11 100644 --- a/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py +++ b/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py @@ -49,9 +49,7 @@ def fit(self, X, y=None): def predict(self, X): X = _rename_column_names_to_numeric(X) - predictions = super().predict(X) - predictions = _convert_to_woodwork_structure(predictions) # UNNECESSARY? 
- return predictions + return super().predict(X) @property def feature_importance(self): diff --git a/evalml/tests/component_tests/test_xgboost_classifier.py b/evalml/tests/component_tests/test_xgboost_classifier.py index d6d76b1e12..ec49e237cc 100644 --- a/evalml/tests/component_tests/test_xgboost_classifier.py +++ b/evalml/tests/component_tests/test_xgboost_classifier.py @@ -61,6 +61,7 @@ def test_xgboost_feature_name_with_random_ascii(problem_type, X_y_binary, X_y_mu X = clf.random_state.random((X.shape[0], len(string.printable))) col_names = ['column_{}'.format(ascii_char) for ascii_char in string.printable] X = pd.DataFrame(X, columns=col_names) + clf.fit(X, y) predictions = clf.predict(X) assert len(predictions) == len(y) From 95f11f7c19862f5b3fd40181e86c7e9b7aff29a9 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Sat, 16 Jan 2021 00:02:16 -0500 Subject: [PATCH 54/98] more minor cleanup --- evalml/automl/automl_search.py | 8 ++------ evalml/pipelines/component_graph.py | 5 ----- evalml/tests/automl_tests/test_automl.py | 1 + 3 files changed, 3 insertions(+), 11 deletions(-) diff --git a/evalml/automl/automl_search.py b/evalml/automl/automl_search.py index dbef6df947..eefe307066 100644 --- a/evalml/automl/automl_search.py +++ b/evalml/automl/automl_search.py @@ -572,12 +572,8 @@ def _tune_binary_threshold(self, pipeline, X_threshold_tuning, y_threshold_tunin pipeline.threshold = 0.5 if X_threshold_tuning: y_predict_proba = pipeline.predict_proba(X_threshold_tuning) - if isinstance(y_predict_proba, pd.DataFrame): - y_predict_proba = y_predict_proba.iloc[:, 1] # shouldnt need - elif isinstance(y_predict_proba, ww.DataTable): - y_predict_proba = y_predict_proba.to_dataframe().iloc[:, 1] - else: - y_predict_proba = y_predict_proba[:, 1] + # y_predict_proba = y_predict_proba.to_dataframe().iloc[:, 1] + y_predict_proba = y_predict_proba.iloc[:, 1] pipeline.threshold = self.objective.optimize_threshold(y_predict_proba, y_threshold_tuning, X=X_threshold_tuning) return pipeline diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 01ae00bb21..65bed5a8f5 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -157,17 +157,12 @@ def compute_final_component_features(self, X, y=None): final_component_inputs = [] for parent in self.get_parents(self.compute_order[-1]): parent_output = component_outputs.get(parent, component_outputs.get(f'{parent}.x')) - if isinstance(parent_output, pd.Series): - # shouldnt happen... 
-            parent_output = pd.DataFrame(parent_output, columns=[parent])
         if isinstance(parent_output, ww.DataColumn):
             parent_output = parent_output.to_series()
             parent_output = pd.DataFrame(parent_output, columns=[parent])
         parent_output = _convert_to_woodwork_structure(parent_output)
         final_component_inputs.append(parent_output)
-        # concatted = pd.concat([i.to_dataframe() for i in final_component_inputs], axis=1)
         concatted = pd.concat([i.to_dataframe() if isinstance(i, ww.DataTable) else i for i in final_component_inputs], axis=1)
-
         return _convert_to_woodwork_structure(concatted)

     def _compute_features(self, component_list, X, y=None, fit=False):
diff --git a/evalml/tests/automl_tests/test_automl.py b/evalml/tests/automl_tests/test_automl.py
index 800ef1665c..b6ee0e582a 100644
--- a/evalml/tests/automl_tests/test_automl.py
+++ b/evalml/tests/automl_tests/test_automl.py
@@ -307,6 +307,7 @@ def _dummy_callback(param1, param2, param3):
     assert "Search Results" not in str_rep

     mock_score.return_value = {automl.objective.name: 1.0}
+    mock_predict_proba.return_value = ww.DataTable(pd.DataFrame([[1.0, 0.0], [0.0, 1.0]]))
     automl.search()
     mock_fit.assert_called()
     mock_score.assert_called()

From cc95be13936bdab6511dcbd9229f1c8ead54b4e3 Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Sat, 16 Jan 2021 00:39:53 -0500
Subject: [PATCH 55/98] a little more cleanup

---
 .../prediction_explanations/_algorithms.py    |  4 ++--
 .../_user_interface.py                        |  3 +--
 .../prediction_explanations/explainers.py     |  3 +--
 evalml/pipelines/classification_pipeline.py   |  2 ++
 evalml/pipelines/component_graph.py           |  3 ---
 .../time_series_baseline_estimator.py         |  2 +-
 .../transformers/column_selectors.py          | 21 ++++++-------------
 7 files changed, 13 insertions(+), 25 deletions(-)

diff --git a/evalml/model_understanding/prediction_explanations/_algorithms.py b/evalml/model_understanding/prediction_explanations/_algorithms.py
index 15ef505df9..df462ffeb3 100644
--- a/evalml/model_understanding/prediction_explanations/_algorithms.py
+++ b/evalml/model_understanding/prediction_explanations/_algorithms.py
@@ -82,8 +82,8 @@ def _compute_shap_values(pipeline, features, training_data=None):

         # More than 100 datapoints can negatively impact runtime according to SHAP
         # https://github.com/slundberg/shap/blob/master/shap/explainers/kernel.py#L114
-        sampled_training_data_features = pipeline.compute_estimator_features(shap.sample(training_data, 100))
-        sampled_training_data_features = _convert_woodwork_types_wrapper(sampled_training_data_features.to_dataframe())
+        sampled_training_data_features = pipeline.compute_estimator_features(shap.sample(training_data, 100)).to_dataframe()
+        # sampled_training_data_features = _convert_woodwork_types_wrapper(sampled_training_data_features.to_dataframe())
         sampled_training_data_features = check_array(sampled_training_data_features)

     if pipeline.problem_type == ProblemTypes.REGRESSION:
diff --git a/evalml/model_understanding/prediction_explanations/_user_interface.py b/evalml/model_understanding/prediction_explanations/_user_interface.py
index 722f1beb6f..d12d67ee06 100644
--- a/evalml/model_understanding/prediction_explanations/_user_interface.py
+++ b/evalml/model_understanding/prediction_explanations/_user_interface.py
@@ -211,8 +211,7 @@ def _make_single_prediction_shap_table(pipeline, input_features, top_k=3, traini
     Returns:
         str: Table
     """
-    pipeline_features = pipeline.compute_estimator_features(input_features)
-    pipeline_features = pipeline_features.to_dataframe()
+    pipeline_features = pipeline.compute_estimator_features(input_features).to_dataframe()
     shap_values = _compute_shap_values(pipeline, pipeline_features, training_data)
     normalized_shap_values = _normalize_shap_values(shap_values)
diff --git a/evalml/model_understanding/prediction_explanations/explainers.py b/evalml/model_understanding/prediction_explanations/explainers.py
index 816f9bb86b..cbf5f741d8 100644
--- a/evalml/model_understanding/prediction_explanations/explainers.py
+++ b/evalml/model_understanding/prediction_explanations/explainers.py
@@ -178,8 +178,7 @@ def explain_predictions_best_worst(pipeline, input_features, y_true, num_to_expl
             errors = metric(y_true, y_pred)
         else:
             y_pred = pipeline.predict_proba(input_features).to_dataframe()
-            y_pred_values = pipeline.predict(input_features)
-            y_pred_values = y_pred_values.to_series()
+            y_pred_values = pipeline.predict(input_features).to_series()
             errors = metric(pipeline._encode_targets(y_true), y_pred)
     except Exception as e:
         tb = traceback.format_tb(sys.exc_info()[2])
diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py
index eadeddc1e9..b13e8a6f14 100644
--- a/evalml/pipelines/classification_pipeline.py
+++ b/evalml/pipelines/classification_pipeline.py
@@ -107,6 +107,8 @@ def predict_proba(self, X):
         """
         X = self.compute_estimator_features(X, y=None)
         proba = self.estimator.predict_proba(X).to_dataframe()
+        # proba = self.estimator.predict_proba(X)
+        # proba = proba.rename({old_name: new_name for old_name, new_name in zip(list(proba.columns.keys), self._encoder.classes_)})
         proba.columns = self._encoder.classes_
         return _convert_to_woodwork_structure(proba)
diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py
index 65bed5a8f5..0d2f828d1d 100644
--- a/evalml/pipelines/component_graph.py
+++ b/evalml/pipelines/component_graph.py
@@ -111,9 +111,6 @@ def fit_features(self, X, y):
         final_component_inputs = []
         for parent in self.get_parents(self.compute_order[-1]):
             parent_output = component_outputs.get(parent, component_outputs.get(f'{parent}.x'))
-            if isinstance(parent_output, pd.Series):
-                # this shouldnt happen anymore, datacolumn
-                parent_output = pd.DataFrame(parent_output, columns=[parent])
             if isinstance(parent_output, ww.DataColumn):
                 parent_output = parent_output.to_series()
                 parent_output = pd.DataFrame(parent_output, columns=[parent])
diff --git a/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py b/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py
index e6221ed814..d2130ccdf0 100644
--- a/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py
+++ b/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py
@@ -57,7 +57,6 @@ def fit(self, X, y=None):
     def predict(self, X, y=None):
         if y is None:
             raise ValueError("Cannot predict Time Series Baseline Estimator if y is None")
-        # TODO indices issue here?
         y = _convert_to_woodwork_structure(y)
         y = _convert_woodwork_types_wrapper(y.to_series())

@@ -71,6 +70,7 @@ def predict_proba(self, X, y=None):
             raise ValueError("Cannot predict Time Series Baseline Estimator if y is None")
         y = _convert_to_woodwork_structure(y)
         y = _convert_woodwork_types_wrapper(y.to_series())
+
         preds = self.predict(X, y).to_series().dropna(axis=0, how='any').astype('int')
         proba_arr = np.zeros((len(preds), y.max() + 1))
         proba_arr[np.arange(len(preds)), preds] = 1
diff --git a/evalml/pipelines/components/transformers/column_selectors.py b/evalml/pipelines/components/transformers/column_selectors.py
index 0fbea2c0de..c6ff2ff4ab 100644
--- a/evalml/pipelines/components/transformers/column_selectors.py
+++ b/evalml/pipelines/components/transformers/column_selectors.py
@@ -29,10 +29,7 @@ def __init__(self, columns=None, random_state=0, **kwargs):

     def _check_input_for_columns(self, X):
         cols = self.parameters.get("columns") or []
-        if isinstance(X, np.ndarray):
-            column_names = range(X.shape[1])
-        else:
-            column_names = X.columns
+        column_names = X.columns

         missing_cols = set(cols) - set(column_names)
         if missing_cols:
@@ -45,7 +42,7 @@ def _modify_columns(self, cols, X, y=None):
         """How the transformer modifies the columns of the input data."""

     def fit(self, X, y=None):
-        """'Fits' the transformer by checking if the column names are present in the dataset.
+        """'Fits the transformer by checking if column names are present in the dataset.

         Arguments:
             X (ww.DataTable, pd.DataFrame): Data to check.
@@ -54,22 +51,16 @@ def fit(self, X, y=None):
         Returns:
             self
         """
+        X = _convert_to_woodwork_structure(X)
         self._check_input_for_columns(X)
         return self

     def transform(self, X, y=None):
         X = _convert_to_woodwork_structure(X)
-        X = _convert_woodwork_types_wrapper(X.to_dataframe())
         self._check_input_for_columns(X)
-
         cols = self.parameters.get("columns") or []
-        cols = self._modify_columns(cols, X, y)
-        return _convert_to_woodwork_structure(cols)
-
-    def fit_transform(self, X, y=None):
-        # transform method already calls fit under the hood.
-        self.fit(X, y)
-        return self.transform(X, y)
+        modified_cols = self._modify_columns(cols, X, y)
+        return _convert_to_woodwork_structure(modified_cols)


 class DropColumns(ColumnSelector):
@@ -79,7 +70,7 @@ class DropColumns(ColumnSelector):
     needs_fitting = False

     def _modify_columns(self, cols, X, y=None):
-        return X.drop(columns=cols, axis=1)
+        return X.drop(columns=cols)

     def transform(self, X, y=None):
         """Transforms data X by dropping columns.
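The patches in this series keep applying one conversion pattern: wrap component inputs and outputs
with _convert_to_woodwork_structure, and unwrap with .to_dataframe()/.to_series() before handing
data to scikit-learn-style objects. The sketch below is a minimal illustration of that round-trip,
assuming the woodwork 0.0.x DataTable/DataColumn API that evalml pinned at the time; the toy frame
is hypothetical.

    import pandas as pd
    import woodwork as ww

    df = pd.DataFrame({"a": [1, 2, 3], "b": ["x", "y", "z"]})  # stand-in component input

    # Roughly what _convert_to_woodwork_structure does for frame-like input:
    # wrap it so components hand typed woodwork data downstream.
    dt = ww.DataTable(df)

    # Roughly what callers do before scikit-learn calls, as in the diffs above:
    # unwrap back to plain pandas.
    plain_df = dt.to_dataframe()

    # Single columns travel as ww.DataColumn and unwrap with .to_series().
    col = ww.DataColumn(df["a"])
    plain_series = col.to_series()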
From a3fd671f469c1d4d4fc77276ce3ee46cb83e941e Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Sat, 16 Jan 2021 01:05:56 -0500
Subject: [PATCH 56/98] even more cleanup

---
 evalml/automl/automl_search.py                |  1 -
 .../prediction_explanations/_algorithms.py    |  2 +-
 .../classifiers/xgboost_classifier.py         |  5 +--
 .../time_series_baseline_estimator.py         |  2 --
 .../regressors/xgboost_regressor.py           |  5 +--
 .../transformers/column_selectors.py          |  7 +----
 .../feature_selection/feature_selector.py     | 31 +++----------------
 .../preprocessing/featuretools.py             |  1 +
 evalml/pipelines/regression_pipeline.py       |  2 +-
 .../component_tests/test_feature_selectors.py |  6 ++--
 .../test_regression.py                        |  9 +++---
 .../test_time_series_pipeline.py              | 10 +++---
 evalml/utils/gen_utils.py                     |  1 +
 13 files changed, 24 insertions(+), 58 deletions(-)

diff --git a/evalml/automl/automl_search.py b/evalml/automl/automl_search.py
index eefe307066..3e274787f4 100644
--- a/evalml/automl/automl_search.py
+++ b/evalml/automl/automl_search.py
@@ -7,7 +7,6 @@
 import cloudpickle
 import numpy as np
 import pandas as pd
-import woodwork as ww
 from sklearn.model_selection import BaseCrossValidator

 from .pipeline_search_plots import PipelineSearchPlots
diff --git a/evalml/model_understanding/prediction_explanations/_algorithms.py b/evalml/model_understanding/prediction_explanations/_algorithms.py
index df462ffeb3..cfb40b49e6 100644
--- a/evalml/model_understanding/prediction_explanations/_algorithms.py
+++ b/evalml/model_understanding/prediction_explanations/_algorithms.py
@@ -6,7 +6,7 @@

 from evalml.model_family.model_family import ModelFamily
 from evalml.problem_types.problem_types import ProblemTypes
-from evalml.utils import _convert_woodwork_types_wrapper, get_logger
+from evalml.utils import get_logger

 logger = get_logger(__file__)
diff --git a/evalml/pipelines/components/estimators/classifiers/xgboost_classifier.py b/evalml/pipelines/components/estimators/classifiers/xgboost_classifier.py
index e3246ac10d..eb50e63d63 100644
--- a/evalml/pipelines/components/estimators/classifiers/xgboost_classifier.py
+++ b/evalml/pipelines/components/estimators/classifiers/xgboost_classifier.py
@@ -4,10 +4,7 @@
 from evalml.pipelines.components.estimators import Estimator
 from evalml.problem_types import ProblemTypes
 from evalml.utils import get_random_seed, import_or_raise
-from evalml.utils.gen_utils import (
-    _convert_to_woodwork_structure,
-    _rename_column_names_to_numeric
-)
+from evalml.utils.gen_utils import _rename_column_names_to_numeric


 class XGBoostClassifier(Estimator):
diff --git a/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py b/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py
index d2130ccdf0..79cdf957d2 100644
--- a/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py
+++ b/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py
@@ -49,8 +49,6 @@ def fit(self, X, y=None):
         if X is None:
             X = pd.DataFrame()
         X = _convert_to_woodwork_structure(X)
-        X = _convert_woodwork_types_wrapper(X.to_dataframe())
-
         self._num_features = X.shape[1]
         return self
diff --git a/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py b/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py
index 5660bf4f11..4d4f3cf0be 100644
--- a/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py
+++ b/evalml/pipelines/components/estimators/regressors/xgboost_regressor.py
@@ -4,10 +4,7 @@
 from evalml.pipelines.components.estimators import Estimator
 from evalml.problem_types import ProblemTypes
 from evalml.utils import get_random_seed, import_or_raise
-from evalml.utils.gen_utils import (
-    _convert_to_woodwork_structure,
-    _rename_column_names_to_numeric
-)
+from evalml.utils.gen_utils import _rename_column_names_to_numeric


 class XGBoostRegressor(Estimator):
diff --git a/evalml/pipelines/components/transformers/column_selectors.py b/evalml/pipelines/components/transformers/column_selectors.py
index c6ff2ff4ab..b93c255890 100644
--- a/evalml/pipelines/components/transformers/column_selectors.py
+++ b/evalml/pipelines/components/transformers/column_selectors.py
@@ -1,12 +1,7 @@
 from abc import abstractmethod

-import numpy as np
-
 from evalml.pipelines.components.transformers import Transformer
-from evalml.utils.gen_utils import (
-    _convert_to_woodwork_structure,
-    _convert_woodwork_types_wrapper
-)
+from evalml.utils.gen_utils import _convert_to_woodwork_structure


 class ColumnSelector(Transformer):
diff --git a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py
index 748ead4040..1ed4c8d214 100644
--- a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py
+++ b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py
@@ -14,20 +14,20 @@ def get_names(self):
         """Get names of selected features.

         Returns:
-            list of the names of features selected
+            List of the names of features selected
         """
         selected_masks = self._component_obj.get_support()
         return [feature_name for (selected, feature_name) in zip(selected_masks, self.input_feature_names) if selected]

     def transform(self, X, y=None):
-        """Transforms data X by selecting features
+        """Transforms input data by selecting features.

         Arguments:
             X (pd.DataFrame): Data to transform
             y (pd.Series, optional): Target data

         Returns:
-            pd.DataFrame: Transformed X
+            ww.DataTable: Transformed X
         """
         X = _convert_to_woodwork_structure(X)
         X = _convert_woodwork_types_wrapper(X.to_dataframe())
@@ -36,31 +36,8 @@ def transform(self, X, y=None):
         try:
             X_t = self._component_obj.transform(X)
         except AttributeError:
-            raise RuntimeError("Transformer requires a transform method or a component_obj that implements transform")
-        X_dtypes = X.dtypes.to_dict()
-        selected_col_names = self.get_names()
-        col_types = {key: X_dtypes[key] for key in selected_col_names}
-        features = pd.DataFrame(X_t, columns=selected_col_names, index=X.index).astype(col_types)
-        return _convert_to_woodwork_structure(features)
-
-    def fit_transform(self, X, y=None):
-        """Fits feature selector on data X then transforms X by selecting features
-
-        Arguments:
-            X (pd.DataFrame): Data to fit and transform
-            y (pd.Series): Target data
-
-        Returns:
-            pd.DataFrame: Transformed X
-        """
-        X = _convert_to_woodwork_structure(X)
-        X = _convert_woodwork_types_wrapper(X.to_dataframe())
-        self.input_feature_names = list(X.columns.values)
-
-        try:
-            X_t = self._component_obj.fit_transform(X, y)
-        except AttributeError:
-            raise RuntimeError("Transformer requires a fit_transform method or a component_obj that implements fit_transform")
+            raise RuntimeError("Feature selector requires a transform method or a component_obj that implements transform")
+
         X_dtypes = X.dtypes.to_dict()
         selected_col_names = self.get_names()
         col_types = {key: X_dtypes[key] for key in selected_col_names}
diff --git a/evalml/pipelines/components/transformers/preprocessing/featuretools.py b/evalml/pipelines/components/transformers/preprocessing/featuretools.py
index ebcea8fa5d..683e9266e5 100644
--- a/evalml/pipelines/components/transformers/preprocessing/featuretools.py
+++ b/evalml/pipelines/components/transformers/preprocessing/featuretools.py
@@ -65,6 +65,7 @@ def transform(self, X, y=None):
         Arguments:
             X (ww.DataTable, pd.DataFrame or np.ndarray): The input training data to transform. Has shape [n_samples, n_features]
             y (ww.DataColumn, pd.Series, optional): Ignored.
+
         Returns:
             ww.DataTable: Feature matrix
         """
diff --git a/evalml/pipelines/regression_pipeline.py b/evalml/pipelines/regression_pipeline.py
index ad3d600d7c..7eaaf227f8 100644
--- a/evalml/pipelines/regression_pipeline.py
+++ b/evalml/pipelines/regression_pipeline.py
@@ -21,13 +21,13 @@ def fit(self, X, y):

         Returns:
             self
-
         """
         X = _convert_to_woodwork_structure(X)
         y = _convert_to_woodwork_structure(y)
         if "numeric" not in y.semantic_tags:
             raise ValueError(f"Regression pipeline can only handle numeric target data")
         y = _convert_woodwork_types_wrapper(y.to_series())
+
         self._fit(X, y)
         return self
diff --git a/evalml/tests/component_tests/test_feature_selectors.py b/evalml/tests/component_tests/test_feature_selectors.py
index e639fd75e8..02187bb145 100644
--- a/evalml/tests/component_tests/test_feature_selectors.py
+++ b/evalml/tests/component_tests/test_feature_selectors.py
@@ -49,11 +49,11 @@ class MockFeatureSelector(FeatureSelector):
         name = "Mock Feature Selector"

         def fit(self, X, y):
-            pass
+            return self

     mock_feature_selector = MockFeatureSelector()
     mock_feature_selector.fit(pd.DataFrame(), pd.Series())
-    with pytest.raises(RuntimeError, match="Transformer requires a transform method or a component_obj that implements transform"):
+    with pytest.raises(RuntimeError, match="Feature selector requires a transform method or a component_obj that implements transform"):
         mock_feature_selector.transform(pd.DataFrame())
-    with pytest.raises(RuntimeError, match="Transformer requires a fit_transform method or a component_obj that implements fit_transform"):
+    with pytest.raises(RuntimeError, match="Feature selector requires a transform method or a component_obj that implements transform"):
         mock_feature_selector.fit_transform(pd.DataFrame())
diff --git a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py
index 10481b9b3a..a73bacebb3 100644
--- a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py
+++ b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py
@@ -29,13 +29,14 @@ def test_woodwork_regression_pipeline(linear_regression_pipeline_class):
 def test_custom_indices():
     # custom regression pipeline
     # don't need to use target encoder, which wont run on core dependencies true tests
-    class MyTargetPipeline(RegressionPipeline):
+    class MyPipeline(RegressionPipeline):
         component_graph = ['Imputer', 'One Hot Encoder', 'Linear Regressor']
-        custom_name = "Target Pipeline"
+        custom_name = "My Pipeline"

     X = pd.DataFrame({"a": ["a", "b", "a", "a", "a", "c", "c", "c"], "b": [0, 1, 1, 1, 1, 1, 0, 1]})
     y = pd.Series([0, 0, 0, 1, 0, 1, 0, 0], index=[7, 2, 1, 4, 5, 3, 6, 8])

     x1, x2, y1, y2 = split_data(X, y, problem_type='regression')
-    tp = MyTargetPipeline({})
-    tp.fit(x2, y2)
+    pipeline = MyPipeline({})
+    pipeline.fit(x2, y2)
+    assert not pd.isnull(pipeline.predict(X).to_series()).any()
diff --git a/evalml/tests/pipeline_tests/test_time_series_pipeline.py b/evalml/tests/pipeline_tests/test_time_series_pipeline.py
index f5bfb3ce07..3359d15957 100644
--- a/evalml/tests/pipeline_tests/test_time_series_pipeline.py
+++ b/evalml/tests/pipeline_tests/test_time_series_pipeline.py
@@ -258,8 +258,8 @@ class MyTsPipeline(pipeline_class):
                           (TimeSeriesMulticlassClassificationPipeline, ["MCC Multiclass", "Log Loss Multiclass"]),
                           (TimeSeriesRegressionPipeline, ['R2']),
                           (TimeSeriesRegressionPipeline, ['R2', "Mean Absolute Percentage Error"])])
-@pytest.mark.parametrize("use_ww", [True, False])
-def test_score_works(pipeline_class, objectives, use_ww, X_y_binary, X_y_multi, X_y_regression, make_data_type):
+@pytest.mark.parametrize("data_type", ["pd", "ww"])
+def test_score_works(pipeline_class, objectives, data_type, X_y_binary, X_y_multi, X_y_regression, make_data_type):

     preprocessing = ['Delayed Feature Transformer']
     if pipeline_class == TimeSeriesRegressionPipeline:
@@ -285,9 +285,9 @@ class Pipeline(pipeline_class):
         X, y = X_y_regression
         y = pd.Series(y)
         expected_unique_values = None
-    if use_ww:
-        X = make_data_type("ww", X)
-        y = make_data_type("ww", y)
+
+    X = make_data_type(data_type, X)
+    y = make_data_type(data_type, y)

     pl.fit(X, y)
     if expected_unique_values:
diff --git a/evalml/utils/gen_utils.py b/evalml/utils/gen_utils.py
index 31bc874053..26089772dd 100644
--- a/evalml/utils/gen_utils.py
+++ b/evalml/utils/gen_utils.py
@@ -339,6 +339,7 @@ def _convert_woodwork_types_wrapper(pd_data):
     nullable_to_numpy_mapping_nan = {pd.Int64Dtype: 'float64',
                                      pd.BooleanDtype: 'object',
                                      pd.StringDtype: 'object'}
+
     if isinstance(pd_data, pd.api.extensions.ExtensionArray):
         if pd.isna(pd_data).any():
             return pd.Series(pd_data.to_numpy(na_value=np.nan), dtype=nullable_to_numpy_mapping_nan[type(pd_data.dtype)])

From 37f80284aa5b1117fd7023a04647de08bd196649 Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Sat, 16 Jan 2021 04:30:42 -0500
Subject: [PATCH 57/98] fix feature selector

---
 .../transformers/feature_selection/feature_selector.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py
index 1ed4c8d214..7690ee097a 100644
--- a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py
+++ b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py
@@ -43,3 +43,6 @@ def transform(self, X, y=None):
         col_types = {key: X_dtypes[key] for key in selected_col_names}
         features = pd.DataFrame(X_t, columns=selected_col_names, index=X.index).astype(col_types)
         return _convert_to_woodwork_structure(features)
+
+    def fit_transform(self, X, y=None):
+        return self.fit(X, y).transform(X, y)

From a7135745218c51fd258e4195699458f07804d416 Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Tue, 19 Jan 2021 02:42:44 -0500
Subject: [PATCH 58/98] clean up and add durations flag to pytest

---
 Makefile                                      |  8 +++----
 .../time_series_baseline_estimator.py         |  1 -
 .../transformers/column_selectors.py          |  2 +-
 .../transformers/imputers/imputer.py          |  5 ++--
 .../transformers/imputers/simple_imputer.py   | 23 ++++++-------------
 .../preprocessing/datetime_featurizer.py      |  6 ++---
 .../preprocessing/drop_null_columns.py        |  2 --
 .../transformers/preprocessing/lsa.py         |  1 -
 evalml/pipelines/components/utils.py          | 16 ++++++-------
 evalml/tests/component_tests/test_lsa.py      |  4 ----
 10 files changed, 24 insertions(+), 44 deletions(-)

diff --git a/Makefile b/Makefile
index e14bbc0392..4ea75e6802 100644
--- a/Makefile
+++ b/Makefile
@@ -18,19 +18,19 @@ lint-fix:

 .PHONY: test
 test:
-	pytest evalml/ --doctest-modules --doctest-continue-on-failure
+	pytest evalml/ --doctest-modules --doctest-continue-on-failure --durations=0

 .PHONY: circleci-test
 circleci-test:
-	pytest evalml/ -n 8 --doctest-modules --cov=evalml --junitxml=test-reports/junit.xml --doctest-continue-on-failure -v
+	pytest evalml/ -n 8 --doctest-modules --cov=evalml --junitxml=test-reports/junit.xml --doctest-continue-on-failure -v --durations=0

 .PHONY: circleci-test-minimal-deps
 circleci-test-minimal-deps:
-	pytest evalml/ -n 8 --doctest-modules --cov=evalml --junitxml=test-reports/junit.xml --doctest-continue-on-failure -v --has-minimal-dependencies
+	pytest evalml/ -n 8 --doctest-modules --cov=evalml --junitxml=test-reports/junit.xml --doctest-continue-on-failure -v --has-minimal-dependencies --durations=0

 .PHONY: win-circleci-test
 win-circleci-test:
-	pytest evalml/ -n 8 --doctest-modules --cov=evalml --junitxml=test-reports/junit.xml --doctest-continue-on-failure -v
+	pytest evalml/ -n 8 --doctest-modules --cov=evalml --junitxml=test-reports/junit.xml --doctest-continue-on-failure -v --durations=0
diff --git a/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py b/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py
index 79cdf957d2..d9307c34db 100644
--- a/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py
+++ b/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py
@@ -68,7 +68,6 @@ def predict_proba(self, X, y=None):
             raise ValueError("Cannot predict Time Series Baseline Estimator if y is None")
         y = _convert_to_woodwork_structure(y)
         y = _convert_woodwork_types_wrapper(y.to_series())
-
         preds = self.predict(X, y).to_series().dropna(axis=0, how='any').astype('int')
         proba_arr = np.zeros((len(preds), y.max() + 1))
         proba_arr[np.arange(len(preds)), preds] = 1
diff --git a/evalml/pipelines/components/transformers/column_selectors.py b/evalml/pipelines/components/transformers/column_selectors.py
index b93c255890..9e45952e58 100644
--- a/evalml/pipelines/components/transformers/column_selectors.py
+++ b/evalml/pipelines/components/transformers/column_selectors.py
@@ -37,7 +37,7 @@ def _modify_columns(self, cols, X, y=None):
         """How the transformer modifies the columns of the input data."""

     def fit(self, X, y=None):
-        """'Fits the transformer by checking if column names are present in the dataset.
+        """Fits the transformer by checking if column names are present in the dataset.

         Arguments:
             X (ww.DataTable, pd.DataFrame): Data to check.
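The --durations=0 flag added to each Makefile target above is plain pytest behavior rather than
anything evalml-specific: --durations=N reports the N slowest tests, and N=0 reports every test's
duration. The ColumnSelector changes above (fit now validates column names against woodwork input)
can be exercised as in this sketch; DropColumns is a real evalml component, while the frame and the
expected output are illustrative assumptions:

    import pandas as pd
    from evalml.pipelines.components import DropColumns

    X = pd.DataFrame({"keep": [1, 2], "drop_me": [3, 4]})
    selector = DropColumns(columns=["drop_me"])
    X_t = selector.fit_transform(X)  # a ww.DataTable after these patches
    assert list(X_t.to_dataframe().columns) == ["keep"]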
diff --git a/evalml/pipelines/components/transformers/imputers/imputer.py b/evalml/pipelines/components/transformers/imputers/imputer.py
index 2727db101b..247b0800d5 100644
--- a/evalml/pipelines/components/transformers/imputers/imputer.py
+++ b/evalml/pipelines/components/transformers/imputers/imputer.py
@@ -106,14 +106,13 @@ def transform(self, X, y=None):

         if self._numeric_cols is not None and len(self._numeric_cols) > 0:
             X_numeric = X_null_dropped[self._numeric_cols]
-            imputed = self._numeric_imputer.transform(X_numeric).to_dataframe()
-            imputed.index = X_null_dropped.index
+            imputed = self._numeric_imputerd.index
             X_null_dropped[X_numeric.columns] = imputed

         if self._categorical_cols is not None and len(self._categorical_cols) > 0:
             X_categorical = X_null_dropped[self._categorical_cols]
             imputed = self._categorical_imputer.transform(X_categorical).to_dataframe()
-            imputed.index = X_null_dropped.index
             X_null_dropped[X_categorical.columns] = imputed

         X_null_dropped = _convert_to_woodwork_structure(X_null_dropped)
+
         return X_null_dropped
diff --git a/evalml/pipelines/components/transformers/imputers/simple_imputer.py b/evalml/pipelines/components/transformers/imputers/simple_imputer.py
index f11c84b40a..71f8ed2b6f 100644
--- a/evalml/pipelines/components/transformers/imputers/simple_imputer.py
+++ b/evalml/pipelines/components/transformers/imputers/simple_imputer.py
@@ -1,4 +1,3 @@
-import numpy as np
 import pandas as pd

 from sklearn.impute import SimpleImputer as SkImputer
@@ -47,13 +46,11 @@ def fit(self, X, y=None):
         """
         X = _convert_to_woodwork_structure(X)
         X = _convert_woodwork_types_wrapper(X.to_dataframe())
+
         # Convert all bool dtypes to category for fitting
         if (X.dtypes == bool).all():
             X = X.astype('category')

-        # Convert None to np.nan, since None cannot be properly handled
-        X = X.fillna(value=np.nan)
-
         self._component_obj.fit(X, y)
         self._all_null_cols = set(X.columns) - set(X.dropna(axis=1, how='all').columns)
         return self
@@ -71,28 +68,22 @@ def transform(self, X, y=None):
         """
         X = _convert_to_woodwork_structure(X)
         X = _convert_woodwork_types_wrapper(X.to_dataframe())
-        # Convert None to np.nan, since None cannot be properly handled
-        X = X.fillna(value=np.nan)  # with woodwork, do we need this?
+
         # Return early since bool dtype doesn't support nans and sklearn errors if all cols are bool
         if (X.dtypes == bool).all():
-            X = _convert_to_woodwork_structure(X)
-            return X
+            return _convert_to_woodwork_structure(X)
+
         X_null_dropped = X.copy()
         X_null_dropped.drop(self._all_null_cols, axis=1, errors='ignore', inplace=True)
-        # category_cols = X_null_dropped.select_dtypes(include=['category']).columns
         X_t = self._component_obj.transform(X)
         if X_null_dropped.empty:
             X_t = pd.DataFrame(X_t, columns=X_null_dropped.columns)
-            X_t = _convert_to_woodwork_structure(X_t)
-            return X_t
+            return _convert_to_woodwork_structure(X_t)
+
         X_t = pd.DataFrame(X_t, columns=X_null_dropped.columns)
         X_t = X_t.infer_objects()
         X_t.index = X_null_dropped.index
-
-        # if len(category_cols) > 0:
-        #     X_t[category_cols] = X_t[category_cols].astype('category')
-        X_t = _convert_to_woodwork_structure(X_t)
-        return X_t
+        return _convert_to_woodwork_structure(X_t)

     def fit_transform(self, X, y=None):
         """Fits on X and transforms X
diff --git a/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py b/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py
index 17b296d7e8..85af2496f7 100644
--- a/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py
+++ b/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py
@@ -94,8 +94,7 @@ def transform(self, X, y=None):
         X_t = X
         features_to_extract = self.parameters["features_to_extract"]
         if len(features_to_extract) == 0:
-            X_t = _convert_to_woodwork_structure(X_t)
-            return X_t
+            return _convert_to_woodwork_structure(X_t)
         for col_name in self._date_time_col_names:
             for feature in features_to_extract:
                 name = f"{col_name}_{feature}"
@@ -104,8 +103,7 @@ def transform(self, X, y=None):
             if categories:
                 self._categories[name] = categories
         X_t = X_t.drop(self._date_time_col_names, axis=1)
-        X_t = _convert_to_woodwork_structure(X_t)
-        return X_t
+        return _convert_to_woodwork_structure(X_t)

     def get_feature_names(self):
         """Gets the categories of each datetime feature.
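The SimpleImputer changes above keep the same external behavior (drop fully-null columns, impute the
rest) but now always hand back a woodwork DataTable. A short usage sketch with a hypothetical frame;
the assertions reflect the dropped-column and mean-imputation behavior shown in the diff:

    import numpy as np
    import pandas as pd
    from evalml.pipelines.components import SimpleImputer

    X = pd.DataFrame({"num": [1.0, np.nan, 3.0], "all_null": [np.nan] * 3})
    imputer = SimpleImputer(impute_strategy="mean")
    X_t = imputer.fit_transform(X)          # a ww.DataTable after these patches
    X_df = X_t.to_dataframe()
    assert "all_null" not in X_df.columns   # fully-null columns are dropped
    assert X_df["num"].iloc[1] == 2.0       # mean of 1.0 and 3.0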
diff --git a/evalml/pipelines/components/transformers/preprocessing/drop_null_columns.py b/evalml/pipelines/components/transformers/preprocessing/drop_null_columns.py
index 3189ade525..61a64a9c51 100644
--- a/evalml/pipelines/components/transformers/preprocessing/drop_null_columns.py
+++ b/evalml/pipelines/components/transformers/preprocessing/drop_null_columns.py
@@ -51,6 +51,4 @@ def transform(self, X, y=None):
             ww.DataTable: Transformed X
         """
         X_t = _convert_to_woodwork_structure(X)
-        # X_t = _convert_woodwork_types_wrapper(X_t.to_dataframe())
-        # return X_t.drop(columns=self._cols_to_drop, axis=1)
         return X_t.drop(self._cols_to_drop)
diff --git a/evalml/pipelines/components/transformers/preprocessing/lsa.py b/evalml/pipelines/components/transformers/preprocessing/lsa.py
index fcaa1e2f29..9c4da7c54d 100644
--- a/evalml/pipelines/components/transformers/preprocessing/lsa.py
+++ b/evalml/pipelines/components/transformers/preprocessing/lsa.py
@@ -61,7 +61,6 @@ def transform(self, X, y=None):
         text_columns = self._get_text_columns(X)
         for col in text_columns:
             transformed = self._lsa_pipeline.transform(X[col])
-
             X_t['LSA({})[0]'.format(col)] = pd.Series(transformed[:, 0], index=X.index)
             X_t['LSA({})[1]'.format(col)] = pd.Series(transformed[:, 1], index=X.index)
         X_t = X_t.drop(columns=text_columns)
diff --git a/evalml/pipelines/components/utils.py b/evalml/pipelines/components/utils.py
index b9bf06891c..281c7df287 100644
--- a/evalml/pipelines/components/utils.py
+++ b/evalml/pipelines/components/utils.py
@@ -144,10 +144,10 @@ def predict(self, X):
         """Make predictions using selected features.

         Arguments:
-            X (pd.DataFrame): Features
+            X (ww.DataTable, pd.DataFrame): Features

         Returns:
-            pd.Series: Predicted values
+            np.ndarray: Predicted values
         """
         check_is_fitted(self, 'is_fitted_')

@@ -157,10 +157,10 @@ def predict_proba(self, X):
         """Make probability estimates for labels.

         Arguments:
-            X (pd.DataFrame): Features
+            X (ww.DataTable, pd.DataFrame): Features

         Returns:
-            pd.DataFrame: Probability estimates
+            np.ndarray: Probability estimates
         """
         return _convert_woodwork_types_wrapper(self.pipeline.predict_proba(X).to_dataframe()).to_numpy()

@@ -181,8 +181,8 @@ def fit(self, X, y):
         """Fits component to data

         Arguments:
-            X (pd.DataFrame or np.ndarray): the input training data of shape [n_samples, n_features]
-            y (pd.Series, optional): the target training data of length [n_samples]
+            X (ww.DataTable, pd.DataFrame or np.ndarray): the input training data of shape [n_samples, n_features]
+            y (ww.DataColumn, pd.Series, optional): the target training data of length [n_samples]

         Returns:
             self
@@ -194,10 +194,10 @@ def predict(self, X):
         """Make predictions using selected features.

         Arguments:
-            X (pd.DataFrame): Features
+            X (ww.DataTable, pd.DataFrame): Features

         Returns:
-            pd.Series: Predicted values
+            np.ndarray: Predicted values
         """
         return self.pipeline.predict(X).to_series().to_numpy()
diff --git a/evalml/tests/component_tests/test_lsa.py b/evalml/tests/component_tests/test_lsa.py
index d3ac641f56..f3cf61c309 100644
--- a/evalml/tests/component_tests/test_lsa.py
+++ b/evalml/tests/component_tests/test_lsa.py
@@ -148,10 +148,6 @@ def test_lsa_output():
                                'Red, the blood of angry men - black, the dark of ages past']})
     lsa = LSA(text_columns=['lsa'])
     lsa.fit(X)
-
-    expected_features = [[0.832, 0.],
-                         [0., 1.],
-                         [0.832, 0.]]
     expected_features = pd.DataFrame([[0.832, 0.],
                                       [0., 1.],
                                       [0.832, 0.]], columns=["LSA(lsa)[0]", "LSA(lsa)[1]"])

From f18b64d03588d5b8976326d7009f7b1a55682315 Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Tue, 19 Jan 2021 02:50:57 -0500
Subject: [PATCH 59/98] oops fix typos

---
 evalml/pipelines/components/transformers/imputers/imputer.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/evalml/pipelines/components/transformers/imputers/imputer.py b/evalml/pipelines/components/transformers/imputers/imputer.py
index 247b0800d5..ddcdcdfdaa 100644
--- a/evalml/pipelines/components/transformers/imputers/imputer.py
+++ b/evalml/pipelines/components/transformers/imputers/imputer.py
@@ -106,7 +106,7 @@ def transform(self, X, y=None):

         if self._numeric_cols is not None and len(self._numeric_cols) > 0:
             X_numeric = X_null_dropped[self._numeric_cols]
-            imputed = self._numeric_imputerd.index
+            imputed = self._numeric_imputer.transform(X_numeric).to_dataframe()
             X_null_dropped[X_numeric.columns] = imputed

         if self._categorical_cols is not None and len(self._categorical_cols) > 0:

From 1ccb1526783dcde32522f0e0bd6526808051515a Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Tue, 19 Jan 2021 14:55:30 -0500
Subject: [PATCH 60/98] update partial dependence impl

---
 evalml/model_understanding/graphs.py | 85 +++++++++++++++++++++++++++-
 1 file changed, 83 insertions(+), 2 deletions(-)

diff --git a/evalml/model_understanding/graphs.py b/evalml/model_understanding/graphs.py
index 5ea3a8fd3d..7380d0f0e5 100644
--- a/evalml/model_understanding/graphs.py
+++ b/evalml/model_understanding/graphs.py
@@ -466,12 +466,37 @@ def partial_dependence(pipeline, X, feature, grid_resolution=100):
     if ((isinstance(feature, int) and X.iloc[:, feature].isnull().sum()) or (isinstance(feature, str) and X[feature].isnull().sum())):
         warnings.warn("There are null values in the features, which will cause NaN values in the partial dependence output. Fill in these values to remove the NaN values.", NullsInColumnWarning)
-    wrapped = scikit_learn_wrapped_estimator(pipeline)
+
+
+    # wrapped = scikit_learn_wrapped_estimator(pipeline)
     if isinstance(pipeline, evalml.pipelines.ClassificationPipeline):
+        class Pipeline(evalml.pipelines.ClassificationPipeline):
+            component_graph = pipeline.component_graph
+            problem_type = pipeline.problem_type
+            _is_fitted = True
+
+            def predict(self, X):
+                return pipeline.predict(X).to_series()
+
+            def predict_proba(self, X):
+                return pipeline.predict_proba(X).to_dataframe()
+        wrapped = Pipeline(parameters=pipeline.parameters)
+
         wrapped._estimator_type = "classifier"
-        wrapped.classes_ = pipeline.classes_
+        wrapped._encoder = pipeline._encoder
+
     elif isinstance(pipeline, evalml.pipelines.RegressionPipeline):
+
+        class Pipeline(evalml.pipelines.RegressionPipeline):
+            component_graph = pipeline.component_graph
+            problem_type = pipeline.problem_type
+            _is_fitted = True
+
+            def predict(self, X):
+                return pipeline.predict(X).to_series()
+        wrapped = Pipeline(parameters=pipeline.parameters)
         wrapped._estimator_type = "regressor"
+    # import pdb; pdb.set_trace()
     wrapped.feature_importances_ = pipeline.feature_importance
     wrapped._is_fitted = True
     avg_pred, values = sk_partial_dependence(wrapped, X=X, features=[feature], grid_resolution=grid_resolution)
@@ -489,6 +514,62 @@ def partial_dependence(pipeline, X, feature, grid_resolution=100):

     return data


+# def partial_dependence(pipeline, X, feature, grid_resolution=100):
+#     """Calculates partial dependence.
+
+#     Arguments:
+#         pipeline (PipelineBase or subclass): Fitted pipeline
+#         X (ww.DataTable, pd.DataFrame, np.ndarray): The input data used to generate a grid of values
+#             for feature where partial dependence will be calculated at
+#         feature (int, string): The target features for which to create the partial dependence plot for.
+#             If feature is an int, it must be the index of the feature to use.
+#             If feature is a string, it must be a valid column name in X.
+
+#     Returns:
+#         pd.DataFrame: DataFrame with averaged predictions for all points in the grid averaged
+#         over all samples of X and the values used to calculate those predictions. The dataframe will
+#         contain two columns: "feature_values" (grid points at which the partial dependence was calculated) and
+#         "partial_dependence" (the partial dependence at that feature value). For classification problems, there
+#         will be a third column called "class_label" (the class label for which the partial
+#         dependence was calculated). For binary classification, the partial dependence is only calculated for the
+#         "positive" class.
+
+#     """
+#     from evalml.pipelines.components.utils import scikit_learn_wrapped_estimator
+#     X = _convert_to_woodwork_structure(X)
+#     X = _convert_woodwork_types_wrapper(X.to_dataframe())
+
+#     if not pipeline._is_fitted:
+#         raise ValueError("Pipeline to calculate partial dependence for must be fitted")
+#     if pipeline.model_family == ModelFamily.BASELINE:
+#         raise ValueError("Partial dependence plots are not supported for Baseline pipelines")
+
+#     if ((isinstance(feature, int) and X.iloc[:, feature].isnull().sum()) or (isinstance(feature, str) and X[feature].isnull().sum())):
+#         warnings.warn("There are null values in the features, which will cause NaN values in the partial dependence output. Fill in these values to remove the NaN values.", NullsInColumnWarning)
+
+#     wrapped = scikit_learn_wrapped_estimator(pipeline)
+#     if isinstance(pipeline, evalml.pipelines.ClassificationPipeline):
+#         wrapped._estimator_type = "classifier"
+#         wrapped.classes_ = pipeline.classes_
+#     elif isinstance(pipeline, evalml.pipelines.RegressionPipeline):
+#         wrapped._estimator_type = "regressor"
+#     wrapped.feature_importances_ = pipeline.feature_importance
+#     wrapped._is_fitted = True
+#     avg_pred, values = sk_partial_dependence(wrapped, X=X, features=[feature], grid_resolution=grid_resolution)
+
+#     classes = None
+#     if isinstance(pipeline, evalml.pipelines.BinaryClassificationPipeline):
+#         classes = [pipeline.classes_[1]]
+#     elif isinstance(pipeline, evalml.pipelines.MulticlassClassificationPipeline):
+#         classes = pipeline.classes_
+
+#     data = pd.DataFrame({"feature_values": np.tile(values[0], avg_pred.shape[0]),
+#                          "partial_dependence": np.concatenate([pred for pred in avg_pred])})
+#     if classes is not None:
+#         data['class_label'] = np.repeat(classes, len(values[0]))
+
+#     return data
+

 def graph_partial_dependence(pipeline, X, feature, class_label=None, grid_resolution=100):
     """Create an one-way partial dependence plot.

From afe07414c8ab022bde272ed58de09559278e75a8 Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Wed, 20 Jan 2021 02:33:53 -0500
Subject: [PATCH 61/98] fix knn

---
 evalml/tests/component_tests/test_knn_classifier.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/evalml/tests/component_tests/test_knn_classifier.py b/evalml/tests/component_tests/test_knn_classifier.py
index 979ba0baba..967a4d158b 100644
--- a/evalml/tests/component_tests/test_knn_classifier.py
+++ b/evalml/tests/component_tests/test_knn_classifier.py
@@ -31,8 +31,8 @@ def test_fit_predict_binary(X_y_binary):
     y_pred = clf.predict(X)
     y_pred_proba = clf.predict_proba(X)
-    np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5)
-    np.testing.assert_almost_equal(y_pred_proba, y_pred_proba_sk, decimal=5)
+    np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series(), decimal=5)
+    np.testing.assert_almost_equal(y_pred_proba_sk, y_pred_proba.to_dataframe(), decimal=5)


 def test_fit_predict_multi(X_y_multi):
@@ -48,8 +48,8 @@ def test_fit_predict_multi(X_y_multi):
     y_pred = clf.predict(X)
     y_pred_proba = clf.predict_proba(X)
-    np.testing.assert_almost_equal(y_pred, y_pred_sk, decimal=5)
-    np.testing.assert_almost_equal(y_pred_proba, y_pred_proba_sk, decimal=5)
+    np.testing.assert_almost_equal(y_pred_sk, y_pred.to_series(), decimal=5)
+    np.testing.assert_almost_equal(y_pred_proba_sk, y_pred_proba.to_dataframe(), decimal=5)


 def test_feature_importance(X_y_binary):

From 69c83ca5eea0f8f4bd35646d273cc9c078a79e3c Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Wed, 20 Jan 2021 07:30:53 -0500
Subject: [PATCH 62/98] clean up graphs

---
 evalml/model_understanding/graphs.py | 85 +---------------------------
 1 file changed, 2 insertions(+), 83 deletions(-)

diff --git a/evalml/model_understanding/graphs.py b/evalml/model_understanding/graphs.py
index 4db4295086..c8aab73732 100644
--- a/evalml/model_understanding/graphs.py
+++ b/evalml/model_understanding/graphs.py
@@ -454,7 +454,6 @@ def partial_dependence(pipeline, X, feature, grid_resolution=100):
         "positive" class.

     """
-    from evalml.pipelines.components.utils import scikit_learn_wrapped_estimator
     X = _convert_to_woodwork_structure(X)
     X = _convert_woodwork_types_wrapper(X.to_dataframe())

@@ -466,36 +465,12 @@ def partial_dependence(pipeline, X, feature, grid_resolution=100):
     if ((isinstance(feature, int) and X.iloc[:, feature].isnull().sum()) or (isinstance(feature, str) and X[feature].isnull().sum())):
         warnings.warn("There are null values in the features, which will cause NaN values in the partial dependence output. Fill in these values to remove the NaN values.", NullsInColumnWarning)

-    # wrapped = scikit_learn_wrapped_estimator(pipeline)
+    wrapped = evalml.pipelines.components.utils.scikit_learn_wrapped_estimator(pipeline)
     if isinstance(pipeline, evalml.pipelines.ClassificationPipeline):
-        class Pipeline(evalml.pipelines.ClassificationPipeline):
-            component_graph = pipeline.component_graph
-            problem_type = pipeline.problem_type
-            _is_fitted = True
-
-            def predict(self, X):
-                return pipeline.predict(X).to_series()
-
-            def predict_proba(self, X):
-                return pipeline.predict_proba(X).to_dataframe()
-        wrapped = Pipeline(parameters=pipeline.parameters)
-
         wrapped._estimator_type = "classifier"
-        wrapped._encoder = pipeline._encoder
-
+        wrapped.classes_ = pipeline.classes_
     elif isinstance(pipeline, evalml.pipelines.RegressionPipeline):
-
-        class Pipeline(evalml.pipelines.RegressionPipeline):
-            component_graph = pipeline.component_graph
-            problem_type = pipeline.problem_type
-            _is_fitted = True
-
-            def predict(self, X):
-                return pipeline.predict(X).to_series()
-        wrapped = Pipeline(parameters=pipeline.parameters)
         wrapped._estimator_type = "regressor"
-    # import pdb; pdb.set_trace()
     wrapped.feature_importances_ = pipeline.feature_importance
     wrapped._is_fitted = True
     avg_pred, values = sk_partial_dependence(wrapped, X=X, features=[feature], grid_resolution=grid_resolution)
@@ -513,62 +488,6 @@ def partial_dependence(pipeline, X, feature, grid_resolution=100):

     return data


-# def partial_dependence(pipeline, X, feature, grid_resolution=100):
-#     """Calculates partial dependence.
-
-#     Arguments:
-#         pipeline (PipelineBase or subclass): Fitted pipeline
-#         X (ww.DataTable, pd.DataFrame, np.ndarray): The input data used to generate a grid of values
-#             for feature where partial dependence will be calculated at
-#         feature (int, string): The target features for which to create the partial dependence plot for.
-#             If feature is an int, it must be the index of the feature to use.
-#             If feature is a string, it must be a valid column name in X.
-
-#     Returns:
-#         pd.DataFrame: DataFrame with averaged predictions for all points in the grid averaged
-#         over all samples of X and the values used to calculate those predictions. The dataframe will
-#         contain two columns: "feature_values" (grid points at which the partial dependence was calculated) and
-#         "partial_dependence" (the partial dependence at that feature value). For classification problems, there
-#         will be a third column called "class_label" (the class label for which the partial
-#         dependence was calculated). For binary classification, the partial dependence is only calculated for the
-#         "positive" class.
-
-#     """
-#     from evalml.pipelines.components.utils import scikit_learn_wrapped_estimator
-#     X = _convert_to_woodwork_structure(X)
-#     X = _convert_woodwork_types_wrapper(X.to_dataframe())
-
-#     if not pipeline._is_fitted:
-#         raise ValueError("Pipeline to calculate partial dependence for must be fitted")
-#     if pipeline.model_family == ModelFamily.BASELINE:
-#         raise ValueError("Partial dependence plots are not supported for Baseline pipelines")
-
-#     if ((isinstance(feature, int) and X.iloc[:, feature].isnull().sum()) or (isinstance(feature, str) and X[feature].isnull().sum())):
-#         warnings.warn("There are null values in the features, which will cause NaN values in the partial dependence output. Fill in these values to remove the NaN values.", NullsInColumnWarning)
-
-#     wrapped = scikit_learn_wrapped_estimator(pipeline)
-#     if isinstance(pipeline, evalml.pipelines.ClassificationPipeline):
-#         wrapped._estimator_type = "classifier"
-#         wrapped.classes_ = pipeline.classes_
-#     elif isinstance(pipeline, evalml.pipelines.RegressionPipeline):
-#         wrapped._estimator_type = "regressor"
-#     wrapped.feature_importances_ = pipeline.feature_importance
-#     wrapped._is_fitted = True
-#     avg_pred, values = sk_partial_dependence(wrapped, X=X, features=[feature], grid_resolution=grid_resolution)
-
-#     classes = None
-#     if isinstance(pipeline, evalml.pipelines.BinaryClassificationPipeline):
-#         classes = [pipeline.classes_[1]]
-#     elif isinstance(pipeline, evalml.pipelines.MulticlassClassificationPipeline):
-#         classes = pipeline.classes_
-
-#     data = pd.DataFrame({"feature_values": np.tile(values[0], avg_pred.shape[0]),
-#                          "partial_dependence": np.concatenate([pred for pred in avg_pred])})
-#     if classes is not None:
-#         data['class_label'] = np.repeat(classes, len(values[0]))
-
-#     return data
-
 def graph_partial_dependence(pipeline, X, feature, class_label=None, grid_resolution=100):
     """Create an one-way partial dependence plot.
From 7c38b624e5fc8bbb3090801cceb8f580c690b227 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 20 Jan 2021 07:39:50 -0500 Subject: [PATCH 63/98] some more cleanup --- .../prediction_explanations/_algorithms.py | 1 - evalml/pipelines/classification_pipeline.py | 4 +-- evalml/pipelines/component_graph.py | 32 ++++++++----------- 3 files changed, 15 insertions(+), 22 deletions(-) diff --git a/evalml/model_understanding/prediction_explanations/_algorithms.py b/evalml/model_understanding/prediction_explanations/_algorithms.py index cfb40b49e6..83b262fd90 100644 --- a/evalml/model_understanding/prediction_explanations/_algorithms.py +++ b/evalml/model_understanding/prediction_explanations/_algorithms.py @@ -83,7 +83,6 @@ def _compute_shap_values(pipeline, features, training_data=None): # More than 100 datapoints can negatively impact runtime according to SHAP # https://github.com/slundberg/shap/blob/master/shap/explainers/kernel.py#L114 sampled_training_data_features = pipeline.compute_estimator_features(shap.sample(training_data, 100)).to_dataframe() - # sampled_training_data_features = _convert_woodwork_types_wrapper(sampled_training_data_features.to_dataframe()) sampled_training_data_features = check_array(sampled_training_data_features) if pipeline.problem_type == ProblemTypes.REGRESSION: diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index b13e8a6f14..f46fdbeb5d 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -78,7 +78,6 @@ def _predict(self, X, objective=None): Returns: pd.Series: Estimated labels """ - # why does this not use objectives... because multiclass doesnt? so maybe this should be moved for less confusion return self._component_graph.predict(X) def predict(self, X, objective=None): @@ -91,8 +90,7 @@ def predict(self, X, objective=None): Returns: pd.Series : Estimated labels """ - predictions = self._predict(X, objective) - predictions = predictions.to_series() + predictions = self._predict(X, objective).to_series() predictions = pd.Series(self._decode_targets(predictions), name=self.input_target_name) return _convert_to_woodwork_structure(predictions) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 0d2f828d1d..bfd983b1c7 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -88,8 +88,8 @@ def fit(self, X, y): """Fit each component in the graph Arguments: - X (pd.DataFrame): The input training data of shape [n_samples, n_features] - y (pd.Series): The target training data of length [n_samples] + X (ww.DataTable, pd.DataFrame): The input training data of shape [n_samples, n_features] + y (ww.DataColumn, pd.Series): The target training data of length [n_samples] """ self._compute_features(self.compute_order, X, y, fit=True) return self @@ -98,8 +98,8 @@ def fit_features(self, X, y): """ Fit all components save the final one, usually an estimator Arguments: - X (pd.DataFrame): The input training data of shape [n_samples, n_features] - y (pd.Series): The target training data of length [n_samples] + X (ww.DataTable, pd.DataFrame): The input training data of shape [n_samples, n_features] + y (ww.DataColumn, pd.Series): The target training data of length [n_samples] Returns: ww.DataTable @@ -121,17 +121,16 @@ def fit_features(self, X, y): return _convert_to_woodwork_structure(concatted) def predict(self, X): - ### TODO """Make predictions using selected features. 
Arguments: - X (pd.DataFrame): Data of shape [n_samples, n_features] + X (ww.DataTable, pd.DataFrame): Data of shape [n_samples, n_features] Returns: - pd.Series: Predicted values. + ww.DataColumn: Predicted values. """ if len(self.compute_order) == 0: - return X + return _convert_to_woodwork_structure(X) final_component = self.compute_order[-1] outputs = self._compute_features(self.compute_order, X) return _convert_to_woodwork_structure(outputs.get(final_component, outputs.get(f'{final_component}.x'))) @@ -142,21 +141,19 @@ def compute_final_component_features(self, X, y=None): to get all the information that should be fed to the final component Arguments: - X (pd.DataFrame): Data of shape [n_samples, n_features] + X (ww.DataTable, pd.DataFrame): Data of shape [n_samples, n_features] Returns: - pd.DataFrame: Transformed values. + ww.DataTable: Transformed values. """ if len(self.compute_order) <= 1: - return X - + return _convert_to_woodwork_structure(X) component_outputs = self._compute_features(self.compute_order[:-1], X, y=y, fit=False) final_component_inputs = [] for parent in self.get_parents(self.compute_order[-1]): parent_output = component_outputs.get(parent, component_outputs.get(f'{parent}.x')) if isinstance(parent_output, ww.DataColumn): - parent_output = parent_output.to_series() - parent_output = pd.DataFrame(parent_output, columns=[parent]) + parent_output = pd.DataFrame(parent_output.to_series(), columns=[parent]) parent_output = _convert_to_woodwork_structure(parent_output) final_component_inputs.append(parent_output) concatted = pd.concat([i.to_dataframe() if isinstance(i, ww.DataTable) else i for i in final_component_inputs], axis=1) @@ -167,18 +164,17 @@ def _compute_features(self, component_list, X, y=None, fit=False): Arguments: component_list (list): The list of component names to compute. - X (pd.DataFrame): Input data to the pipeline to transform. - y (pd.Series): The target training data of length [n_samples] + X (ww.DataTable, d.DataFrame): Input data to the pipeline to transform. + y (ww.DataColumn, pd.Series): The target training data of length [n_samples] fit (bool): Whether to fit the estimators as well as transform it. Defaults to False. 
Returns: dict - outputs from each component """ + X = _convert_to_woodwork_structure(X) if len(component_list) == 0: return X - X = _convert_to_woodwork_structure(X) - output_cache = {} original_logical_types = X.logical_types for component_name in component_list: From 8ce1c11b152e3b580295574b5c4ab3b8b9cf8798 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 20 Jan 2021 07:42:12 -0500 Subject: [PATCH 64/98] cleanup gen utils --- evalml/utils/gen_utils.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/evalml/utils/gen_utils.py b/evalml/utils/gen_utils.py index 46900aa589..1dc2d75d83 100644 --- a/evalml/utils/gen_utils.py +++ b/evalml/utils/gen_utils.py @@ -367,7 +367,7 @@ def pad_with_nans(pd_data, num_to_pad): Returns: pd.DataFrame or pd.Series """ - if isinstance(pd_data, pd.Series) or isinstance(pd_data, ww.DataColumn): + if isinstance(pd_data, pd.Series): padding = pd.Series([np.nan] * num_to_pad, name=pd_data.name) else: padding = pd.DataFrame({col: [np.nan] * num_to_pad From 4dcddb93aa2d7672c2ccf86c2e671e4f3d951d62 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 20 Jan 2021 22:48:28 -0500 Subject: [PATCH 65/98] fix tests --- evalml/tests/pipeline_tests/test_component_graph.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/evalml/tests/pipeline_tests/test_component_graph.py b/evalml/tests/pipeline_tests/test_component_graph.py index ef74fd2d08..efeb7fd61f 100644 --- a/evalml/tests/pipeline_tests/test_component_graph.py +++ b/evalml/tests/pipeline_tests/test_component_graph.py @@ -499,7 +499,7 @@ def test_compute_final_component_features_single_component(mock_transform, X_y_b component_graph.fit(X, y) X_t = component_graph.compute_final_component_features(X) - assert_frame_equal(X, X_t) + assert_frame_equal(X, X_t.to_dataframe()) @patch('evalml.pipelines.components.Imputer.fit_transform') @@ -523,7 +523,7 @@ def test_predict_empty_graph(X_y_binary): component_graph.fit(X, y) X_t = component_graph.predict(X) - assert_frame_equal(X, X_t) + assert_frame_equal(X, X_t.to_dataframe()) @patch('evalml.pipelines.components.OneHotEncoder.fit_transform') From 7b4e4e5035859eac75c27a231ea14c3f5b9240b2 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Wed, 20 Jan 2021 23:31:19 -0500 Subject: [PATCH 66/98] major cleanup, condense component graph --- docs/source/user_guide/pipelines.ipynb | 5 +- evalml/automl/automl_search.py | 5 +- evalml/model_understanding/graphs.py | 1 + .../binary_classification_pipeline.py | 3 +- evalml/pipelines/classification_pipeline.py | 10 ++-- evalml/pipelines/component_graph.py | 57 ++++++++----------- evalml/preprocessing/utils.py | 14 ++--- 7 files changed, 40 insertions(+), 55 deletions(-) diff --git a/docs/source/user_guide/pipelines.ipynb b/docs/source/user_guide/pipelines.ipynb index cc48817c3c..f055c51f33 100644 --- a/docs/source/user_guide/pipelines.ipynb +++ b/docs/source/user_guide/pipelines.ipynb @@ -410,9 +410,8 @@ " \"\"\"\n", "\n", " X = _convert_to_woodwork_structure(X)\n", - " X = _convert_woodwork_types_wrapper(X.to_dataframe())\n", - " X_t = X.drop(columns=self._cols_to_drop, axis=1)\n", - " return _convert_to_woodwork_structure(X_t)\n", + " return X.drop(columns=self._cols_to_drop)\n", + "\n", "\n", "class CustomPipeline(MulticlassClassificationPipeline):\n", " name = \"Custom Pipeline\"\n", diff --git a/evalml/automl/automl_search.py b/evalml/automl/automl_search.py index cd38586247..511b6cca01 100644 --- a/evalml/automl/automl_search.py +++ b/evalml/automl/automl_search.py @@ -567,8 +567,8 @@ def 
_tune_binary_threshold(self, pipeline, X_threshold_tuning, y_threshold_tunin Arguments: pipeline (Pipeline): Pipeline instance to threshold - X_threshold_tuning (ww DataTable): X data to tune pipeline to - y_threshold_tuning (ww DataColumn): Target data to tune pipeline to + X_threshold_tuning (ww.DataTable): X data to tune pipeline to + y_threshold_tuning (ww.DataColumn): Target data to tune pipeline to Returns: Trained pipeline instance @@ -577,7 +577,6 @@ def _tune_binary_threshold(self, pipeline, X_threshold_tuning, y_threshold_tunin pipeline.threshold = 0.5 if X_threshold_tuning: y_predict_proba = pipeline.predict_proba(X_threshold_tuning) - # y_predict_proba = y_predict_proba.to_dataframe().iloc[:, 1] y_predict_proba = y_predict_proba.iloc[:, 1] pipeline.threshold = self.objective.optimize_threshold(y_predict_proba, y_threshold_tuning, X=X_threshold_tuning) return pipeline diff --git a/evalml/model_understanding/graphs.py b/evalml/model_understanding/graphs.py index c8aab73732..a92be72581 100644 --- a/evalml/model_understanding/graphs.py +++ b/evalml/model_understanding/graphs.py @@ -473,6 +473,7 @@ def partial_dependence(pipeline, X, feature, grid_resolution=100): wrapped._estimator_type = "regressor" wrapped.feature_importances_ = pipeline.feature_importance wrapped._is_fitted = True + avg_pred, values = sk_partial_dependence(wrapped, X=X, features=[feature], grid_resolution=grid_resolution) classes = None diff --git a/evalml/pipelines/binary_classification_pipeline.py b/evalml/pipelines/binary_classification_pipeline.py index 30ab750a79..d016322ea9 100644 --- a/evalml/pipelines/binary_classification_pipeline.py +++ b/evalml/pipelines/binary_classification_pipeline.py @@ -36,8 +36,7 @@ def _predict(self, X, objective=None): if self.threshold is None: return self._component_graph.predict(X) - ypred_proba = self.predict_proba(X) - ypred_proba = ypred_proba.to_dataframe() + ypred_proba = self.predict_proba(X).to_dataframe() ypred_proba = ypred_proba.iloc[:, 1] if objective is None: return _convert_to_woodwork_structure(ypred_proba > self.threshold) diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index f46fdbeb5d..38bf84f532 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -72,11 +72,11 @@ def _predict(self, X, objective=None): """Make predictions using selected features. 
Arguments: - X (pd.DataFrame): Data of shape [n_samples, n_features] + X (ww.DataTable, pd.DataFrame): Data of shape [n_samples, n_features] objective (Object or string): The objective to use to make predictions Returns: - pd.Series: Estimated labels + ww.DataColumn: Estimated labels """ return self._component_graph.predict(X) @@ -105,8 +105,6 @@ def predict_proba(self, X): """ X = self.compute_estimator_features(X, y=None) proba = self.estimator.predict_proba(X).to_dataframe() - # proba = self.estimator.predict_proba(X) - # proba = proba.rename({old_name: new_name for old_name, new_name in zip(list(proba.columns.keys), self._encoder.classes_)}) proba.columns = self._encoder.classes_ return _convert_to_woodwork_structure(proba) @@ -127,11 +125,11 @@ def score(self, X, y, objectives): y = self._encode_targets(y) y_predicted, y_predicted_proba = self._compute_predictions(X, objectives) if y_predicted is not None: - y_predicted = _convert_to_woodwork_structure(y_predicted) + # y_predicted = _convert_to_woodwork_structure(y_predicted) y_predicted = _convert_woodwork_types_wrapper(y_predicted.to_series()) if y_predicted_proba is not None: - y_predicted_proba = _convert_to_woodwork_structure(y_predicted_proba) + # y_predicted_proba = _convert_to_woodwork_structure(y_predicted_proba) y_predicted_proba = _convert_woodwork_types_wrapper(y_predicted_proba.to_dataframe()) return self._score_all_objectives(X, y, y_predicted, y_predicted_proba, objectives) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index bfd983b1c7..0704347378 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -102,12 +102,27 @@ def fit_features(self, X, y): y (ww.DataColumn, pd.Series): The target training data of length [n_samples] Returns: - ww.DataTable + ww.DataTable: Transformed values. + """ + return self._fit_transform_feature_helper(True, X, y) + + def compute_final_component_features(self, X, y=None): + """Transform all components save the final one, and gathers the data from any number of parents + to get all the information that should be fed to the final component + + Arguments: + X (ww.DataTable, pd.DataFrame): Data of shape [n_samples, n_features] + y (ww.DataColumn, pd.Series): The target training data of length [n_samples]. Defaults to None. + + Returns: + ww.DataTable: Transformed values. 
""" + return self._fit_transform_feature_helper(False, X, y) + + def _fit_transform_feature_helper(self, fit, X, y=None): if len(self.compute_order) <= 1: return _convert_to_woodwork_structure(X) - - component_outputs = self._compute_features(self.compute_order[:-1], X, y=y, fit=True) + component_outputs = self._compute_features(self.compute_order[:-1], X, y=y, fit=fit) final_component_inputs = [] for parent in self.get_parents(self.compute_order[-1]): parent_output = component_outputs.get(parent, component_outputs.get(f'{parent}.x')) @@ -116,7 +131,6 @@ def fit_features(self, X, y): parent_output = pd.DataFrame(parent_output, columns=[parent]) parent_output = _convert_to_woodwork_structure(parent_output) final_component_inputs.append(parent_output) - concatted = pd.concat([component_input.to_dataframe() for component_input in final_component_inputs], axis=1) return _convert_to_woodwork_structure(concatted) @@ -135,30 +149,6 @@ def predict(self, X): outputs = self._compute_features(self.compute_order, X) return _convert_to_woodwork_structure(outputs.get(final_component, outputs.get(f'{final_component}.x'))) - def compute_final_component_features(self, X, y=None): - ### TODO: COMBINE WITH fit_features - """ Transform all components save the final one, and gathers the data from any number of parents - to get all the information that should be fed to the final component - - Arguments: - X (ww.DataTable, pd.DataFrame): Data of shape [n_samples, n_features] - - Returns: - ww.DataTable: Transformed values. - """ - if len(self.compute_order) <= 1: - return _convert_to_woodwork_structure(X) - component_outputs = self._compute_features(self.compute_order[:-1], X, y=y, fit=False) - final_component_inputs = [] - for parent in self.get_parents(self.compute_order[-1]): - parent_output = component_outputs.get(parent, component_outputs.get(f'{parent}.x')) - if isinstance(parent_output, ww.DataColumn): - parent_output = pd.DataFrame(parent_output.to_series(), columns=[parent]) - parent_output = _convert_to_woodwork_structure(parent_output) - final_component_inputs.append(parent_output) - concatted = pd.concat([i.to_dataframe() if isinstance(i, ww.DataTable) else i for i in final_component_inputs], axis=1) - return _convert_to_woodwork_structure(concatted) - def _compute_features(self, component_list, X, y=None, fit=False): """Transforms the data by applying the given components. @@ -170,7 +160,7 @@ def _compute_features(self, component_list, X, y=None, fit=False): Defaults to False. 
Returns:
-            dict - outputs from each component
+            dict: Outputs from each component
        """
        X = _convert_to_woodwork_structure(X)
        if len(component_list) == 0:
@@ -229,7 +219,7 @@ def _compute_features(self, component_list, X, y=None, fit=False):

    @staticmethod
    def _consolidate_inputs(x_inputs, y_input, X, y):
-        """ Combines any/all X and y inputs for a component, including handling defaults
+        """Combines any/all X and y inputs for a component, including handling defaults

        Arguments:
            x_inputs (list(pd.DataFrame)): Data to be used as X input for a component
@@ -238,10 +228,8 @@ def _consolidate_inputs(x_inputs, y_input, X, y):
            y (pd.Series): The original y input, to be used if there is no parent y input

        Returns:
-            pd.DataFrame, pd.Series: The X and y transformed values to evaluate a component with
+            ww.DataTable, ww.DataColumn: The X and y transformed values to evaluate a component with
        """
-        merged_types_dict = {}
-
        if len(x_inputs) == 0:
            return_x = X
        else:
@@ -250,7 +238,8 @@ def _consolidate_inputs(x_inputs, y_input, X, y):
        if y_input is not None:
            return_y = y_input
        return_x = _convert_to_woodwork_structure(return_x)
-        return_x.set_types(merged_types_dict)
+        return_y = _convert_to_woodwork_structure(return_y)
+
        return return_x, return_y

    def get_component(self, component_name):
diff --git a/evalml/preprocessing/utils.py b/evalml/preprocessing/utils.py
index b39d5c27cc..029eaf119a 100644
--- a/evalml/preprocessing/utils.py
+++ b/evalml/preprocessing/utils.py
@@ -48,12 +48,12 @@ def load_data(path, index, target, n_rows=None, drop=None, verbose=True, **kwarg


 def split_data(X, y, problem_type, problem_configuration=None, test_size=.2, random_state=0):
-    """splits data into train and test sets.
+    """Splits data into train and test sets.

     Arguments:
-        X (ww.datatable, pd.dataframe or np.ndarray): data of shape [n_samples, n_features]
-        y (ww.datacolumn, pd.series, or np.ndarray): target data of length [n_samples]
-        problem_type (str or problemtypes): type of supervised learning problem. see evalml.problem_types.problemtype.all_problem_types for a full list.
+        X (ww.DataTable, pd.DataFrame or np.ndarray): Data of shape [n_samples, n_features]
+        y (ww.DataColumn, pd.Series, or np.ndarray): Target data of length [n_samples]
+        problem_type (str or ProblemTypes): Type of supervised learning problem. See evalml.problem_types.problemtype.all_problem_types for a full list.
         problem_configuration (dict, None): Additional parameters needed to configure the search. For example,
             in time series problems, values should be passed in for the gap and max_delay variables.
         test_size (float): What percentage of data points should be included in the test set. Defaults to 0.2 (20%).
@@ -122,11 +122,11 @@ def drop_nan_target_rows(X, y):
     """Drops rows in X and y when the corresponding row in the target y has a value of NaN.

     Arguments:
-        X (pd.DataFrame): Data to transform
-        y (pd.Series): Target data
+        X (pd.DataFrame, np.ndarray): Data to transform
+        y (pd.Series, np.ndarray): Target data

     Returns:
-        pd.DataFrame: Transformed X (and y, if passed in) with rows that had a NaN value removed.
+        pd.DataFrame, pd.Series: Transformed X and y, with rows that had a NaN value in the target removed.
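+
+    Example (a minimal sketch):
+        >>> import numpy as np
+        >>> import pandas as pd
+        >>> X = pd.DataFrame({'feature': [1, 2, 3]})
+        >>> y = pd.Series([0.0, np.nan, 1.0])
+        >>> X_t, y_t = drop_nan_target_rows(X, y)  # the row where y is NaN is dropped from both X and y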
""" X_t = X y_t = y From c21c3aa2c4c88f6e1e230e1d283982625d73c92c Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 00:08:27 -0500 Subject: [PATCH 67/98] oops fix test --- evalml/pipelines/classification_pipeline.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index 38bf84f532..aad0cd842c 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -125,11 +125,11 @@ def score(self, X, y, objectives): y = self._encode_targets(y) y_predicted, y_predicted_proba = self._compute_predictions(X, objectives) if y_predicted is not None: - # y_predicted = _convert_to_woodwork_structure(y_predicted) + y_predicted = _convert_to_woodwork_structure(y_predicted) y_predicted = _convert_woodwork_types_wrapper(y_predicted.to_series()) if y_predicted_proba is not None: - # y_predicted_proba = _convert_to_woodwork_structure(y_predicted_proba) + y_predicted_proba = _convert_to_woodwork_structure(y_predicted_proba) y_predicted_proba = _convert_woodwork_types_wrapper(y_predicted_proba.to_dataframe()) return self._score_all_objectives(X, y, y_predicted, y_predicted_proba, objectives) From 316d7d24347fbccd95719afc33e967c0c7dd2bfa Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 00:14:51 -0500 Subject: [PATCH 68/98] fix tests --- evalml/pipelines/classification_pipeline.py | 2 -- evalml/pipelines/component_graph.py | 4 ++-- evalml/tests/automl_tests/test_automl.py | 2 +- 3 files changed, 3 insertions(+), 5 deletions(-) diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index aad0cd842c..a421d07c96 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -125,11 +125,9 @@ def score(self, X, y, objectives): y = self._encode_targets(y) y_predicted, y_predicted_proba = self._compute_predictions(X, objectives) if y_predicted is not None: - y_predicted = _convert_to_woodwork_structure(y_predicted) y_predicted = _convert_woodwork_types_wrapper(y_predicted.to_series()) if y_predicted_proba is not None: - y_predicted_proba = _convert_to_woodwork_structure(y_predicted_proba) y_predicted_proba = _convert_woodwork_types_wrapper(y_predicted_proba.to_dataframe()) return self._score_all_objectives(X, y, y_predicted, y_predicted_proba, objectives) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 0704347378..c7c31c525d 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -238,8 +238,8 @@ def _consolidate_inputs(x_inputs, y_input, X, y): if y_input is not None: return_y = y_input return_x = _convert_to_woodwork_structure(return_x) - return_y = _convert_to_woodwork_structure(return_y) - + if return_y is not None: + return_y = _convert_to_woodwork_structure(return_y) return return_x, return_y def get_component(self, component_name): diff --git a/evalml/tests/automl_tests/test_automl.py b/evalml/tests/automl_tests/test_automl.py index 9921a47b40..385f413ea2 100644 --- a/evalml/tests/automl_tests/test_automl.py +++ b/evalml/tests/automl_tests/test_automl.py @@ -75,7 +75,7 @@ def test_search_results(X_y_regression, X_y_binary, X_y_multi, automl_type): expected_pipeline_class = MulticlassClassificationPipeline X, y = X_y_multi - automl = AutoMLSearch(X_train=X, y_train=y, problem_type=automl_type, max_iterations=2, n_jobs=1) + automl = AutoMLSearch(X_train=X, 
y_train=y, problem_type=automl_type, max_iterations=2, n_jobs=1, error_callback=raise_error_callback) automl.search() assert automl.results.keys() == {'pipeline_results', 'search_order', 'errors'} assert automl.results['search_order'] == [0, 1] From 0c69dfbfd248e3faf37b07758a8487d53c09c7b6 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 01:18:24 -0500 Subject: [PATCH 69/98] fix more tests --- evalml/tests/pipeline_tests/test_pipelines.py | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/evalml/tests/pipeline_tests/test_pipelines.py b/evalml/tests/pipeline_tests/test_pipelines.py index 63f3668b19..e197d1e0eb 100644 --- a/evalml/tests/pipeline_tests/test_pipelines.py +++ b/evalml/tests/pipeline_tests/test_pipelines.py @@ -909,9 +909,9 @@ def test_score_multiclass_single(mock_predict, mock_fit, mock_encode, X_y_binary @patch('evalml.pipelines.MulticlassClassificationPipeline._encode_targets') @patch('evalml.pipelines.MulticlassClassificationPipeline.fit') @patch('evalml.pipelines.ComponentGraph.predict') -def test_score_nonlinear_multiclass(mock_encode, mock_fit, mock_predict, nonlinear_multiclass_pipeline_class, X_y_multi): +def test_score_nonlinear_multiclass(mock_predict, mock_fit, mock_encode, nonlinear_multiclass_pipeline_class, X_y_multi): X, y = X_y_multi - mock_predict.return_value = y + mock_predict.return_value = ww.DataColumn(y) mock_encode.return_value = y clf = nonlinear_multiclass_pipeline_class({}) clf.fit(X, y) @@ -1016,7 +1016,7 @@ def test_score_binary_objective_error(mock_predict, mock_fit, mock_objective_sco def test_score_nonlinear_binary_objective_error(mock_predict, mock_fit, mock_objective_score, mock_encode, nonlinear_binary_pipeline_class, X_y_binary): mock_objective_score.side_effect = Exception('finna kabooom 💣') X, y = X_y_binary - mock_predict.return_value = y + mock_predict.return_value = ww.DataColumn(y) mock_encode.return_value = y clf = nonlinear_binary_pipeline_class({}) clf.fit(X, y) @@ -1061,10 +1061,10 @@ def test_compute_estimator_features(mock_scaler, mock_ohe, mock_imputer, X_y_bin X, y = X_y_binary X = pd.DataFrame(X) X_expected = pd.DataFrame(index=X.index, columns=X.columns).fillna(0) + mock_imputer.return_value = ww.DataTable(X) + mock_ohe.return_value = ww.DataTable(X) + mock_scaler.return_value = ww.DataTable(X_expected) X_expected = X_expected.astype("Int64") - mock_imputer.return_value = X - mock_ohe.return_value = X - mock_scaler.return_value = X_expected pipeline = logistic_regression_binary_pipeline_class({}) pipeline.fit(X, y) From 152d1ce766f38e117bc16cf17dddac1a013efdb0 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 13:22:17 -0500 Subject: [PATCH 70/98] rename helper and add docstrings --- evalml/pipelines/component_graph.py | 20 +++++++++++++++----- 1 file changed, 15 insertions(+), 5 deletions(-) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index c7c31c525d..12f2e04738 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -95,7 +95,7 @@ def fit(self, X, y): return self def fit_features(self, X, y): - """ Fit all components save the final one, usually an estimator + """Fit all components save the final one, usually an estimator Arguments: X (ww.DataTable, pd.DataFrame): The input training data of shape [n_samples, n_features] @@ -104,7 +104,7 @@ def fit_features(self, X, y): Returns: ww.DataTable: Transformed values. 
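+
+        Example (an illustrative sketch; the instantiated graph and the training data
+        X and y are assumptions):
+            >>> feature_matrix = component_graph.fit_features(X, y)  # fits all but the final component; returns a ww.DataTable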
""" - return self._fit_transform_feature_helper(True, X, y) + return self._fit_transform_features_helper(True, X, y) def compute_final_component_features(self, X, y=None): """Transform all components save the final one, and gathers the data from any number of parents @@ -117,12 +117,22 @@ def compute_final_component_features(self, X, y=None): Returns: ww.DataTable: Transformed values. """ - return self._fit_transform_feature_helper(False, X, y) + return self._fit_transform_features_helper(False, X, y) - def _fit_transform_feature_helper(self, fit, X, y=None): + def _fit_transform_features_helper(self, needs_fitting, X, y=None): + """Helper function that transforms the input data based on the component graph components. + + Arguments: + needs_fitting (bool): Determines if components should be fit. + X (ww.DataTable, pd.DataFrame): Data of shape [n_samples, n_features] + y (ww.DataColumn, pd.Series): The target training data of length [n_samples]. Defaults to None. + + Returns: + ww.DataTable: Transformed values. + """ if len(self.compute_order) <= 1: return _convert_to_woodwork_structure(X) - component_outputs = self._compute_features(self.compute_order[:-1], X, y=y, fit=fit) + component_outputs = self._compute_features(self.compute_order[:-1], X, y=y, fit=needs_fitting) final_component_inputs = [] for parent in self.get_parents(self.compute_order[-1]): parent_output = component_outputs.get(parent, component_outputs.get(f'{parent}.x')) From 0ac7bb9f11c6558348e388d6682db2f6578cb711 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 13:58:18 -0500 Subject: [PATCH 71/98] cleaning up docstrings and linting --- .../automl_algorithm/automl_algorithm.py | 2 +- .../automl_algorithm/iterative_algorithm.py | 2 +- evalml/automl/automl_search.py | 4 +-- evalml/automl/utils.py | 16 +++++----- evalml/data_checks/outliers_data_check.py | 2 +- evalml/model_understanding/graphs.py | 2 +- evalml/pipelines/classification_pipeline.py | 2 +- evalml/pipelines/component_graph.py | 30 +++++++++---------- .../ensemble/stacked_ensemble_base.py | 2 +- .../ensemble/stacked_ensemble_classifier.py | 2 +- .../ensemble/stacked_ensemble_regressor.py | 2 +- .../classifiers/baseline_classifier.py | 2 +- .../classifiers/catboost_classifier.py | 5 +--- .../classifiers/lightgbm_classifier.py | 10 +++---- .../regressors/baseline_regressor.py | 3 +- .../regressors/lightgbm_regressor.py | 3 +- .../time_series_baseline_estimator.py | 5 ++-- .../preprocessing/datetime_featurizer.py | 2 +- .../preprocessing/featuretools.py | 7 ++--- .../transformers/preprocessing/lsa.py | 2 +- .../preprocessing/text_transformer.py | 2 +- evalml/pipelines/pipeline_base.py | 2 +- .../time_series_classification_pipelines.py | 2 +- .../time_series_regression_pipeline.py | 2 +- evalml/preprocessing/utils.py | 2 +- evalml/tuners/skopt_tuner.py | 2 +- evalml/tuners/tuner.py | 2 +- 27 files changed, 55 insertions(+), 64 deletions(-) diff --git a/evalml/automl/automl_algorithm/automl_algorithm.py b/evalml/automl/automl_algorithm/automl_algorithm.py index 5a91ec2ef1..06f3596580 100644 --- a/evalml/automl/automl_algorithm/automl_algorithm.py +++ b/evalml/automl/automl_algorithm/automl_algorithm.py @@ -25,7 +25,7 @@ def __init__(self, allowed_pipelines (list(class)): A list of PipelineBase subclasses indicating the pipelines allowed in the search. The default of None indicates all pipelines for this problem type are allowed. max_iterations (int): The maximum number of iterations to be evaluated. 
tuner_class (class): A subclass of Tuner, to be used to find parameters for each pipeline. The default of None indicates the SKOptTuner will be used. - random_state (int, np.random.RandomState): The random seed/state. Defaults to 0. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. """ self.random_state = get_random_state(random_state) self.allowed_pipelines = allowed_pipelines or [] diff --git a/evalml/automl/automl_algorithm/iterative_algorithm.py b/evalml/automl/automl_algorithm/iterative_algorithm.py index 8604147f07..b06849e27d 100644 --- a/evalml/automl/automl_algorithm/iterative_algorithm.py +++ b/evalml/automl/automl_algorithm/iterative_algorithm.py @@ -31,7 +31,7 @@ def __init__(self, allowed_pipelines (list(class)): A list of PipelineBase subclasses indicating the pipelines allowed in the search. The default of None indicates all pipelines for this problem type are allowed. max_iterations (int): The maximum number of iterations to be evaluated. tuner_class (class): A subclass of Tuner, to be used to find parameters for each pipeline. The default of None indicates the SKOptTuner will be used. - random_state (int, np.random.RandomState): The random seed/state. Defaults to 0. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. pipelines_per_batch (int): the number of pipelines to be evaluated in each batch, after the first batch. n_jobs (int or None): Non-negative integer describing level of parallelism used for pipelines. number_features (int): The number of columns in the input features. diff --git a/evalml/automl/automl_search.py b/evalml/automl/automl_search.py index 511b6cca01..e8155c9eb5 100644 --- a/evalml/automl/automl_search.py +++ b/evalml/automl/automl_search.py @@ -157,7 +157,7 @@ def __init__(self, additional_objectives (list): Custom set of objectives to score on. Will override default objectives for problem type if not empty. - random_state (int, np.random.RandomState): The random seed/state. Defaults to 0. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. n_jobs (int or None): Non-negative integer describing level of parallelism used for pipelines. None and 1 are equivalent. If set to -1, all CPUs are used. For n_jobs below -1, (n_cpus + 1 + n_jobs) are used. @@ -847,7 +847,7 @@ def get_pipeline(self, pipeline_id, random_state=0): Arguments: pipeline_id (int): pipeline to retrieve - random_state (int, np.random.RandomState): The random seed/state. Defaults to 0. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. Returns: PipelineBase: untrained pipeline instance associated with the provided ID diff --git a/evalml/automl/utils.py b/evalml/automl/utils.py index 10ffb23cb2..399eb2b4b8 100644 --- a/evalml/automl/utils.py +++ b/evalml/automl/utils.py @@ -39,17 +39,17 @@ def make_data_splitter(X, y, problem_type, problem_configuration=None, n_splits= """Given the training data and ML problem parameters, compute a data splitting method to use during AutoML search. Arguments: - X (pd.DataFrame, ww.DataTable): The input training data of shape [n_samples, n_features]. - y (pd.Series, ww.DataColumn): The target training data of length [n_samples]. - problem_type (ProblemType): the type of machine learning problem. + X (ww.DataTable, pd.DataFrame): The input training data of shape [n_samples, n_features]. + y (ww.DataColumn, pd.Series): The target training data of length [n_samples]. 
+ problem_type (ProblemType): The type of machine learning problem. problem_configuration (dict, None): Additional parameters needed to configure the search. For example, - in time series problems, values should be passed in for the gap and max_delay variables. - n_splits (int, None): the number of CV splits, if applicable. Default 3. - shuffle (bool): whether or not to shuffle the data before splitting, if applicable. Default True. - random_state (int, np.random.RandomState): The random seed/state. Defaults to 0. + in time series problems, values should be passed in for the gap and max_delay variables. Defaults to None. + n_splits (int, None): The number of CV splits, if applicable. Defaults to 3. + shuffle (bool): Whether or not to shuffle the data before splitting, if applicable. Defaults to True. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. Returns: - sklearn.model_selection.BaseCrossValidator: data splitting method. + sklearn.model_selection.BaseCrossValidator: Data splitting method. """ problem_type = handle_problem_types(problem_type) data_splitter = None diff --git a/evalml/data_checks/outliers_data_check.py b/evalml/data_checks/outliers_data_check.py index dff5678157..176707476e 100644 --- a/evalml/data_checks/outliers_data_check.py +++ b/evalml/data_checks/outliers_data_check.py @@ -19,7 +19,7 @@ def __init__(self, random_state=0): """Checks if there are any outliers in the input data. Arguments: - random_state (int, np.random.RandomState): The random seed/state. Defaults to 0. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. """ self.random_state = get_random_state(random_state) diff --git a/evalml/model_understanding/graphs.py b/evalml/model_understanding/graphs.py index a92be72581..47ae575b3d 100644 --- a/evalml/model_understanding/graphs.py +++ b/evalml/model_understanding/graphs.py @@ -293,7 +293,7 @@ def calculate_permutation_importance(pipeline, X, y, objective, n_repeats=5, n_j n_repeats (int): Number of times to permute a feature. Defaults to 5. n_jobs (int or None): Non-negative integer describing level of parallelism used for pipelines. None and 1 are equivalent. If set to -1, all CPUs are used. For n_jobs below -1, (n_cpus + 1 + n_jobs) are used. - random_state (int, np.random.RandomState): The random seed/state. Defaults to 0. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. Returns: Mean feature importance scores over 5 shuffles. diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index a421d07c96..391ae30fa2 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -22,7 +22,7 @@ def __init__(self, parameters, random_state=0): Arguments: parameters (dict): Dictionary with component names as keys and dictionary of that component's parameters as values. An empty dictionary {} implies using all default values for component parameters. - random_state (int, np.random.RandomState): The random seed/state. Defaults to 0. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. 
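+
+        Example (an illustrative sketch; MyBinaryPipeline is a hypothetical subclass
+        that defines its own component_graph):
+            >>> pipeline = MyBinaryPipeline(parameters={'Imputer': {'numeric_impute_strategy': 'median'}}, random_state=0)
+            >>> pipeline.fit(X, y)  # X and y are assumed training data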
""" self._encoder = LabelEncoder() super().__init__(parameters, random_state) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index 12f2e04738..e5858069d3 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -123,7 +123,7 @@ def _fit_transform_features_helper(self, needs_fitting, X, y=None): """Helper function that transforms the input data based on the component graph components. Arguments: - needs_fitting (bool): Determines if components should be fit. + needs_fitting (boolean): Determines if components should be fit. X (ww.DataTable, pd.DataFrame): Data of shape [n_samples, n_features] y (ww.DataColumn, pd.Series): The target training data of length [n_samples]. Defaults to None. @@ -176,14 +176,13 @@ def _compute_features(self, component_list, X, y=None, fit=False): if len(component_list) == 0: return X output_cache = {} - original_logical_types = X.logical_types + input_logical_types = X.logical_types for component_name in component_list: component_instance = self.get_component(component_name) if not isinstance(component_instance, ComponentBase): raise ValueError('All components must be instantiated before fitting or predicting') x_inputs = [] y_input = None - merged_types_dict = {} for parent_input in self.get_parents(component_name): if parent_input[-2:] == '.y': if y_input is not None: @@ -192,17 +191,16 @@ def _compute_features(self, component_list, X, y=None, fit=False): else: parent_x = output_cache.get(parent_input, output_cache.get(f'{parent_input}.x')) if isinstance(parent_x, ww.DataTable): - merged_types_dict.update(parent_x.logical_types) parent_x = _convert_woodwork_types_wrapper(parent_x.to_dataframe()) elif isinstance(parent_x, ww.DataColumn): - # following what was previously here, but could probs be simplified. - parent_x = pd.DataFrame(_convert_woodwork_types_wrapper(parent_x.to_series()), columns=[parent_input]) + parent_x = pd.Series(_convert_woodwork_types_wrapper(parent_x.to_series()), name=parent_input) x_inputs.append(parent_x) input_x, input_y = self._consolidate_inputs(x_inputs, y_input, X, y) - for t in original_logical_types: - # numeric is special(ints, floats. ex: targetencoder.) 
- if t in input_x.columns and "numeric" not in input_x[t].semantic_tags: - input_x = input_x.set_types({t: original_logical_types[t]}) + for col in input_logical_types: + if (col in input_x.columns and + input_logical_types[col] != input_x[col].logical_type and + "numeric" not in input_x[col].semantic_tags): # numeric is special because we may not be able to safely convert (ex: input is int, output is float) + input_x = input_x.set_types({col: input_logical_types[col]}) self.input_feature_names.update({component_name: list(input_x.columns)}) if isinstance(component_instance, Transformer): @@ -234,8 +232,8 @@ def _consolidate_inputs(x_inputs, y_input, X, y): Arguments: x_inputs (list(pd.DataFrame)): Data to be used as X input for a component y_input (pd.Series, None): If present, the Series to use as y input for a component, different from the original y - X (pd.DataFrame): The original X input, to be used if there is no parent X input - y (pd.Series): The original y input, to be used if there is no parent y input + X (ww.DataTable, pd.DataFrame): The original X input, to be used if there is no parent X input + y (ww.DataColumn, pd.Series): The original y input, to be used if there is no parent y input Returns: ww.DataTable, ww.DataColumn: The X and y transformed values to evaluate a component with @@ -281,7 +279,7 @@ def get_estimators(self): """Gets a list of all the estimator components within this graph Returns: - list: all estimator objects within the graph + list: All estimator objects within the graph """ if not isinstance(self.get_last_component(), ComponentBase): raise ValueError('Cannot get estimators until the component graph is instantiated') @@ -294,7 +292,7 @@ def get_parents(self, component_name): component_name (str): Name of the child component to look up Returns: - list(str): iterator of parent component names + list(str): Iterator of parent component names """ try: component_info = self.component_dict[component_name] @@ -380,10 +378,10 @@ def __iter__(self): return self def __next__(self): - """Iterator for graphs, prints the components in the graph in order + """Iterator for graphs, retrieves the components in the graph in order Returns: - ComponentBase - the next component class or instance in the graph + ComponentBase obj: The next component class or instance in the graph """ if self._i < len(self.compute_order): self._i += 1 diff --git a/evalml/pipelines/components/ensemble/stacked_ensemble_base.py b/evalml/pipelines/components/ensemble/stacked_ensemble_base.py index 37437e8917..fc82b13b49 100644 --- a/evalml/pipelines/components/ensemble/stacked_ensemble_base.py +++ b/evalml/pipelines/components/ensemble/stacked_ensemble_base.py @@ -32,7 +32,7 @@ def __init__(self, input_pipelines=None, final_estimator=None, cv=None, n_jobs=N None and 1 are equivalent. If set to -1, all CPUs are used. For n_jobs below -1, (n_cpus + 1 + n_jobs) are used. Defaults to None. - Note: there could be some multi-process errors thrown for values of `n_jobs != 1`. If this is the case, please use `n_jobs = 1`. - random_state (int, np.random.RandomState): seed for the random number generator + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. 
""" if not input_pipelines: raise EnsembleMissingPipelinesError("`input_pipelines` must not be None or an empty list.") diff --git a/evalml/pipelines/components/ensemble/stacked_ensemble_classifier.py b/evalml/pipelines/components/ensemble/stacked_ensemble_classifier.py index e94e76d8dc..8f8bc59e6a 100644 --- a/evalml/pipelines/components/ensemble/stacked_ensemble_classifier.py +++ b/evalml/pipelines/components/ensemble/stacked_ensemble_classifier.py @@ -37,7 +37,7 @@ def __init__(self, input_pipelines=None, final_estimator=None, None and 1 are equivalent. If set to -1, all CPUs are used. For n_jobs below -1, (n_cpus + 1 + n_jobs) are used. Defaults to None. - Note: there could be some multi-process errors thrown for values of `n_jobs != 1`. If this is the case, please use `n_jobs = 1`. - random_state (int, np.random.RandomState): seed for the random number generator + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. """ super().__init__(input_pipelines=input_pipelines, final_estimator=final_estimator, cv=cv, n_jobs=n_jobs, random_state=random_state, **kwargs) diff --git a/evalml/pipelines/components/ensemble/stacked_ensemble_regressor.py b/evalml/pipelines/components/ensemble/stacked_ensemble_regressor.py index 4c65e04062..93680e279d 100644 --- a/evalml/pipelines/components/ensemble/stacked_ensemble_regressor.py +++ b/evalml/pipelines/components/ensemble/stacked_ensemble_regressor.py @@ -36,7 +36,7 @@ def __init__(self, input_pipelines=None, final_estimator=None, None and 1 are equivalent. If set to -1, all CPUs are used. For n_jobs below -1, (n_cpus + 1 + n_jobs) are used. Defaults to None. - Note: there could be some multi-process errors thrown for values of `n_jobs != 1`. If this is the case, please use `n_jobs = 1`. - random_state (int, np.random.RandomState): Seed for the random number generator + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. """ super().__init__(input_pipelines=input_pipelines, final_estimator=final_estimator, cv=cv, n_jobs=n_jobs, random_state=random_state, **kwargs) diff --git a/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py b/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py index a8eaa04c3c..cd53fd6fd7 100644 --- a/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py +++ b/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py @@ -26,7 +26,7 @@ def __init__(self, strategy="mode", random_state=0, **kwargs): Arguments: strategy (str): Method used to predict. Valid options are "mode", "random" and "random_weighted". Defaults to "mode". - random_state (int, np.random.RandomState): Seed for the random number generator + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. 
""" if strategy not in ["mode", "random", "random_weighted"]: raise ValueError("'strategy' parameter must equal either 'mode', 'random', or 'random_weighted'") diff --git a/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py b/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py index ee3d6d8ddd..22392c8225 100644 --- a/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py +++ b/evalml/pipelines/components/estimators/classifiers/catboost_classifier.py @@ -81,10 +81,7 @@ def predict(self, X): predictions = predictions.flatten() if self._label_encoder: predictions = self._label_encoder.inverse_transform(predictions.astype(np.int64)) - if not isinstance(predictions, pd.Series): - predictions = pd.Series(predictions) - predictions = _convert_to_woodwork_structure(predictions) - return predictions + return _convert_to_woodwork_structure(predictions) @property def feature_importance(self): diff --git a/evalml/pipelines/components/estimators/classifiers/lightgbm_classifier.py b/evalml/pipelines/components/estimators/classifiers/lightgbm_classifier.py index cf8dfd9e31..c1cac086aa 100644 --- a/evalml/pipelines/components/estimators/classifiers/lightgbm_classifier.py +++ b/evalml/pipelines/components/estimators/classifiers/lightgbm_classifier.py @@ -106,12 +106,12 @@ def fit(self, X, y=None): def predict(self, X): X_encoded = self._encode_categories(X) - predictions = super().predict(X_encoded).to_series() - if self._label_encoder: - predictions = pd.Series(self._label_encoder.inverse_transform(predictions.astype(np.int64))) + predictions = super().predict(X_encoded) + if not self._label_encoder: + return predictions + predictions = pd.Series(self._label_encoder.inverse_transform(predictions.to_series().astype(np.int64))) return _convert_to_woodwork_structure(predictions) def predict_proba(self, X): X_encoded = self._encode_categories(X) - prediction_proba = super().predict_proba(X_encoded) - return _convert_to_woodwork_structure(prediction_proba) + return super().predict_proba(X_encoded) diff --git a/evalml/pipelines/components/estimators/regressors/baseline_regressor.py b/evalml/pipelines/components/estimators/regressors/baseline_regressor.py index 2c3b2d9723..9675c3620f 100644 --- a/evalml/pipelines/components/estimators/regressors/baseline_regressor.py +++ b/evalml/pipelines/components/estimators/regressors/baseline_regressor.py @@ -25,8 +25,7 @@ def __init__(self, strategy="mean", random_state=0, **kwargs): Arguments: strategy (str): method used to predict. Valid options are "mean", "median". Defaults to "mean". - random_state (int, np.random.RandomState): seed for the random number generator - + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. 
""" if strategy not in ["mean", "median"]: raise ValueError("'strategy' parameter must equal either 'mean' or 'median'") diff --git a/evalml/pipelines/components/estimators/regressors/lightgbm_regressor.py b/evalml/pipelines/components/estimators/regressors/lightgbm_regressor.py index 2ac804852b..de11eaded3 100644 --- a/evalml/pipelines/components/estimators/regressors/lightgbm_regressor.py +++ b/evalml/pipelines/components/estimators/regressors/lightgbm_regressor.py @@ -92,5 +92,4 @@ def fit(self, X, y=None): def predict(self, X): X_encoded = self._encode_categories(X) - predictions = super().predict(X_encoded) - return predictions + return super().predict(X_encoded) diff --git a/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py b/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py index d9307c34db..cea43991bc 100644 --- a/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py +++ b/evalml/pipelines/components/estimators/regressors/time_series_baseline_estimator.py @@ -27,9 +27,8 @@ def __init__(self, gap=1, random_state=0, **kwargs): """Baseline time series estimator that predicts using the naive forecasting approach. Arguments: - gap (int): gap between prediction date and target date and must be a positive integer. If gap is 0, target date will be shifted ahead by 1 time period. - random_state (int, np.random.RandomState): seed for the random number generator - + gap (int): Gap between prediction date and target date and must be a positive integer. If gap is 0, target date will be shifted ahead by 1 time period. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. """ self._prediction_value = None diff --git a/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py b/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py index 85af2496f7..8589c83f1c 100644 --- a/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py +++ b/evalml/pipelines/components/transformers/preprocessing/datetime_featurizer.py @@ -55,7 +55,7 @@ def __init__(self, features_to_extract=None, encode_as_categories=False, random_ features_to_extract (list): List of features to extract. Valid options include "year", "month", "day_of_week", "hour". encode_as_categories (bool): Whether day-of-week and month features should be encoded as pandas "category" dtype. This allows OneHotEncoders to encode these features. - random_state (int, np.random.RandomState): Seed for the random number generator. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. """ if features_to_extract is None: features_to_extract = ["year", "month", "day_of_week", "hour"] diff --git a/evalml/pipelines/components/transformers/preprocessing/featuretools.py b/evalml/pipelines/components/transformers/preprocessing/featuretools.py index 683e9266e5..aa881eba08 100644 --- a/evalml/pipelines/components/transformers/preprocessing/featuretools.py +++ b/evalml/pipelines/components/transformers/preprocessing/featuretools.py @@ -18,7 +18,7 @@ def __init__(self, index='index', random_state=0, **kwargs): Arguments: index (string): The name of the column that contains the indices. If no column with this name exists, then featuretools.EntitySet() creates a column with this name to serve as the index column. 
Defaults to 'index' - random_state (int, np.random.RandomState): seed for the random number generator + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. """ parameters = {"index": index} if not isinstance(index, str): @@ -31,8 +31,7 @@ def __init__(self, index='index', random_state=0, **kwargs): random_state=random_state) def _make_entity_set(self, X): - """helper method that creates and returns the entity set given the datatable X - """ + """Helper method that creates and returns the entity set given the input data""" ft_es = EntitySet() if self.index not in X.columns: es = ft_es.entity_from_dataframe(entity_id="X", dataframe=X, index=self.index, make_index=True) @@ -41,7 +40,7 @@ def _make_entity_set(self, X): return es def fit(self, X, y=None): - """Fits the DFSTransformer Transformer component + """Fits the DFSTransformer Transformer component. Arguments: X (ww.DataTable, pd.DataFrame, np.array): The input data to transform, of shape [n_samples, n_features] diff --git a/evalml/pipelines/components/transformers/preprocessing/lsa.py b/evalml/pipelines/components/transformers/preprocessing/lsa.py index 9c4da7c54d..9ae5d46c61 100644 --- a/evalml/pipelines/components/transformers/preprocessing/lsa.py +++ b/evalml/pipelines/components/transformers/preprocessing/lsa.py @@ -22,7 +22,7 @@ def __init__(self, text_columns=None, random_state=0, **kwargs): Arguments: text_columns (list): list of feature names which should be treated as text features. - random_state (int, np.random.RandomState): Seed for the random number generator. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. """ self._lsa_pipeline = make_pipeline(TfidfVectorizer(), TruncatedSVD(random_state=random_state)) super().__init__(text_columns=text_columns, diff --git a/evalml/pipelines/components/transformers/preprocessing/text_transformer.py b/evalml/pipelines/components/transformers/preprocessing/text_transformer.py index 2d894be70d..66ee7e349f 100644 --- a/evalml/pipelines/components/transformers/preprocessing/text_transformer.py +++ b/evalml/pipelines/components/transformers/preprocessing/text_transformer.py @@ -12,7 +12,7 @@ def __init__(self, text_columns=None, component_obj=None, random_state=0, **kwar Arguments: text_columns (list): list of feature names which should be treated as text features. - random_state (int, np.random.RandomState): Seed for the random number generator. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. """ parameters = {'text_columns': text_columns} parameters.update(kwargs) diff --git a/evalml/pipelines/pipeline_base.py b/evalml/pipelines/pipeline_base.py index 2a380a5ea6..afb4ad55ef 100644 --- a/evalml/pipelines/pipeline_base.py +++ b/evalml/pipelines/pipeline_base.py @@ -58,7 +58,7 @@ def __init__(self, parameters, random_state=0): Arguments: parameters (dict): Dictionary with component names as keys and dictionary of that component's parameters as values. An empty dictionary {} implies using all default values for component parameters. - random_state (int, np.random.RandomState): The random seed/state. Defaults to 0. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. 
""" self.random_state = get_random_state(random_state) if isinstance(self.component_graph, list): # Backwards compatibility diff --git a/evalml/pipelines/time_series_classification_pipelines.py b/evalml/pipelines/time_series_classification_pipelines.py index fac4529ace..19e3ce826f 100644 --- a/evalml/pipelines/time_series_classification_pipelines.py +++ b/evalml/pipelines/time_series_classification_pipelines.py @@ -26,7 +26,7 @@ def __init__(self, parameters, random_state=0): An empty dictionary {} implies using all default values for component parameters. Pipeline-level parameters such as gap and max_delay must be specified with the "pipeline" key. For example: Pipeline(parameters={"pipeline": {"max_delay": 4, "gap": 2}}). - random_state (int, np.random.RandomState): The random seed/state. Defaults to 0. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. """ if "pipeline" not in parameters: raise ValueError("gap and max_delay parameters cannot be omitted from the parameters dict. " diff --git a/evalml/pipelines/time_series_regression_pipeline.py b/evalml/pipelines/time_series_regression_pipeline.py index 8c86ed9519..73522a7045 100644 --- a/evalml/pipelines/time_series_regression_pipeline.py +++ b/evalml/pipelines/time_series_regression_pipeline.py @@ -28,7 +28,7 @@ def __init__(self, parameters, random_state=0): An empty dictionary {} implies using all default values for component parameters. Pipeline-level parameters such as gap and max_delay must be specified with the "pipeline" key. For example: Pipeline(parameters={"pipeline": {"max_delay": 4, "gap": 2}}). - random_state (int, np.random.RandomState): The random seed/state. Defaults to 0. + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. """ if "pipeline" not in parameters: raise ValueError("gap and max_delay parameters cannot be omitted from the parameters dict. " diff --git a/evalml/preprocessing/utils.py b/evalml/preprocessing/utils.py index 029eaf119a..dc2095a1ad 100644 --- a/evalml/preprocessing/utils.py +++ b/evalml/preprocessing/utils.py @@ -57,7 +57,7 @@ def split_data(X, y, problem_type, problem_configuration=None, test_size=.2, ran problem_configuration (dict, None): Additional parameters needed to configure the search. For example, in time series problems, values should be passed in for the gap and max_delay variables. test_size (float): What percentage of data points should be included in the test set. Defaults to 0.2 (20%). - random_state (int, np.random.RandomState): Seed for the random number generator + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. Returns: ww.DataTable, ww.DataTable, ww.DataColumn, ww.DataColumn: Feature and target data each split into train and test sets diff --git a/evalml/tuners/skopt_tuner.py b/evalml/tuners/skopt_tuner.py index fe9f649a54..0dc92a6019 100644 --- a/evalml/tuners/skopt_tuner.py +++ b/evalml/tuners/skopt_tuner.py @@ -19,7 +19,7 @@ def __init__(self, pipeline_hyperparameter_ranges, random_state=0): Arguments: pipeline_hyperparameter_ranges (dict): a set of hyperparameter ranges corresponding to a pipeline's parameters - random_state (int, np.random.RandomState): The random state + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. 
""" super().__init__(pipeline_hyperparameter_ranges, random_state=random_state) self.opt = Optimizer(self._search_space_ranges, "ET", acq_optimizer="sampling", random_state=random_state) diff --git a/evalml/tuners/tuner.py b/evalml/tuners/tuner.py index 795a940c38..a215c9fc3d 100644 --- a/evalml/tuners/tuner.py +++ b/evalml/tuners/tuner.py @@ -14,7 +14,7 @@ def __init__(self, pipeline_hyperparameter_ranges, random_state=0): Arguments: pipeline_hyperparameter_ranges (dict): a set of hyperparameter ranges corresponding to a pipeline's parameters - random_state (int, np.random.RandomState): The random state + random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. """ self._pipeline_hyperparameter_ranges = pipeline_hyperparameter_ranges self._parameter_names_map = dict() From 23edbcede93261b529259d6f96a243d9c5b2b6ee Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 14:05:25 -0500 Subject: [PATCH 72/98] more docstring updates --- evalml/pipelines/binary_classification_pipeline.py | 8 ++++---- evalml/pipelines/classification_pipeline.py | 6 +++--- evalml/pipelines/pipeline_base.py | 4 ++-- evalml/pipelines/time_series_classification_pipelines.py | 6 +++--- evalml/pipelines/time_series_regression_pipeline.py | 2 +- 5 files changed, 13 insertions(+), 13 deletions(-) diff --git a/evalml/pipelines/binary_classification_pipeline.py b/evalml/pipelines/binary_classification_pipeline.py index d016322ea9..b7c93e3a85 100644 --- a/evalml/pipelines/binary_classification_pipeline.py +++ b/evalml/pipelines/binary_classification_pipeline.py @@ -22,11 +22,11 @@ def _predict(self, X, objective=None): """Make predictions using selected features. Arguments: - X (pd.DataFrame): Data of shape [n_samples, n_features] + X (ww.DataTable, pd.DataFrame): Data of shape [n_samples, n_features] objective (Object or string): The objective to use to make predictions Returns: - pd.Series: Estimated labels + ww.DataColumn: Estimated labels """ if objective is not None: @@ -46,10 +46,10 @@ def predict_proba(self, X): """Make probability estimates for labels. Assumes that the column at index 1 represents the positive label case. 
Arguments: - X (pd.DataFrame or np.ndarray): Data of shape [n_samples, n_features] + X (ww.DataTable, pd.DataFrame or np.ndarray): Data of shape [n_samples, n_features] Returns: - pd.DataFrame: probability estimates + ww.DataTable: probability estimates """ return super().predict_proba(X) diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index 391ae30fa2..75ae946aa3 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -88,7 +88,7 @@ def predict(self, X, objective=None): objective (Object or string): The objective to use to make predictions Returns: - pd.Series : Estimated labels + ww.DataColumn: Estimated labels """ predictions = self._predict(X, objective).to_series() predictions = pd.Series(self._decode_targets(predictions), name=self.input_target_name) @@ -101,7 +101,7 @@ def predict_proba(self, X): X (ww.DataTable, pd.DataFrame or np.ndarray): Data of shape [n_samples, n_features] Returns: - pd.DataFrame: Probability estimates + ww.DataTable: Probability estimates """ X = self.compute_estimator_features(X, y=None) proba = self.estimator.predict_proba(X).to_dataframe() @@ -132,7 +132,7 @@ def score(self, X, y, objectives): return self._score_all_objectives(X, y, y_predicted, y_predicted_proba, objectives) def _compute_predictions(self, X, objectives): - """Scan through the objectives list and precompute""" + """Helper function to scan through the objectives list and precompute probabilities.""" y_predicted = None y_predicted_proba = None for objective in objectives: diff --git a/evalml/pipelines/pipeline_base.py b/evalml/pipelines/pipeline_base.py index afb4ad55ef..0400a81600 100644 --- a/evalml/pipelines/pipeline_base.py +++ b/evalml/pipelines/pipeline_base.py @@ -182,10 +182,10 @@ def compute_estimator_features(self, X, y=None): """Transforms the data by applying all pre-processing components. Arguments: - X (pd.DataFrame): Input data to the pipeline to transform. + X (ww.DataTable, pd.DataFrame): Input data to the pipeline to transform. Returns: - pd.DataFrame - New transformed features. + ww.DataTable: New transformed features. """ X_t = self._component_graph.compute_final_component_features(X, y=y) return X_t diff --git a/evalml/pipelines/time_series_classification_pipelines.py b/evalml/pipelines/time_series_classification_pipelines.py index 19e3ce826f..971f4dab3b 100644 --- a/evalml/pipelines/time_series_classification_pipelines.py +++ b/evalml/pipelines/time_series_classification_pipelines.py @@ -111,7 +111,7 @@ def predict(self, X, y=None, objective=None): objective (Object or string): The objective to use to make predictions Returns: - pd.Series: Predicted values. + ww.DataColumn: Predicted values. 
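+
+        Example (an illustrative sketch; the fitted pipeline and the data X and y are assumptions):
+            >>> predictions = pipeline.predict(X, y)  # ww.DataColumn, padded with NaNs for rows dropped by delayed features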
""" X, y = self._convert_to_woodwork(X, y) X = _convert_woodwork_types_wrapper(X.to_dataframe()) @@ -136,7 +136,7 @@ def predict_proba(self, X, y=None): X (ww.DataTable, pd.DataFrame or np.ndarray): Data of shape [n_samples, n_features] Returns: - pd.DataFrame: Probability estimates + ww.DataTable: Probability estimates """ X, y = self._convert_to_woodwork(X, y) X = _convert_woodwork_types_wrapper(X.to_dataframe()) @@ -173,7 +173,7 @@ def score(self, X, y, objectives): Arguments: X (ww.DataTable, pd.DataFrame or np.ndarray): Data of shape [n_samples, n_features] - y (pd.Series, ww.DataColumn): True labels of length [n_samples] + y (ww.DataColumn, pd.Series): True labels of length [n_samples] objectives (list): Non-empty list of objectives to score on Returns: diff --git a/evalml/pipelines/time_series_regression_pipeline.py b/evalml/pipelines/time_series_regression_pipeline.py index 73522a7045..ba1e2fd77f 100644 --- a/evalml/pipelines/time_series_regression_pipeline.py +++ b/evalml/pipelines/time_series_regression_pipeline.py @@ -72,7 +72,7 @@ def predict(self, X, y=None, objective=None): objective (Object or string): The objective to use to make predictions Returns: - pd.Series: Predicted values. + ww.DataColumn: Predicted values. """ if X is None: X = pd.DataFrame() From 35d5972758c97c50e660ca15e81c310f8593f1e9 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 14:35:29 -0500 Subject: [PATCH 73/98] more cleanup of impl and docstrings --- .../binary_classification_pipeline.py | 2 +- .../components/estimators/estimator.py | 6 ++--- .../transformers/encoders/onehot_encoder.py | 11 ++++---- .../time_series_classification_pipelines.py | 27 ++++--------------- 4 files changed, 13 insertions(+), 33 deletions(-) diff --git a/evalml/pipelines/binary_classification_pipeline.py b/evalml/pipelines/binary_classification_pipeline.py index b7c93e3a85..c9d36d72f8 100644 --- a/evalml/pipelines/binary_classification_pipeline.py +++ b/evalml/pipelines/binary_classification_pipeline.py @@ -49,7 +49,7 @@ def predict_proba(self, X): X (ww.DataTable, pd.DataFrame or np.ndarray): Data of shape [n_samples, n_features] Returns: - ww.DataTable: probability estimates + ww.DataTable: Probability estimates """ return super().predict_proba(X) diff --git a/evalml/pipelines/components/estimators/estimator.py b/evalml/pipelines/components/estimators/estimator.py index 0eda360635..cfaf35a98d 100644 --- a/evalml/pipelines/components/estimators/estimator.py +++ b/evalml/pipelines/components/estimators/estimator.py @@ -45,8 +45,7 @@ def predict(self, X): predictions = self._component_obj.predict(X) except AttributeError: raise MethodPropertyNotFoundError("Estimator requires a predict method or a component_obj that implements predict") - predictions = _convert_to_woodwork_structure(predictions) - return predictions + return _convert_to_woodwork_structure(predictions) def predict_proba(self, X): """Make probability estimates for labels. 
@@ -63,8 +62,7 @@ def predict_proba(self, X): pred_proba = self._component_obj.predict_proba(X) except AttributeError: raise MethodPropertyNotFoundError("Estimator requires a predict_proba method or a component_obj that implements predict_proba") - pred_proba = _convert_to_woodwork_structure(pred_proba) - return pred_proba + return _convert_to_woodwork_structure(pred_proba) @property def feature_importance(self): diff --git a/evalml/pipelines/components/transformers/encoders/onehot_encoder.py b/evalml/pipelines/components/transformers/encoders/onehot_encoder.py index 4c732cd775..59f74cf9c8 100644 --- a/evalml/pipelines/components/transformers/encoders/onehot_encoder.py +++ b/evalml/pipelines/components/transformers/encoders/onehot_encoder.py @@ -123,14 +123,14 @@ def fit(self, X, y=None): return self def transform(self, X, y=None): - """One-hot encode the input DataFrame. + """One-hot encode the input data. Arguments: - X (pd.DataFrame): Dataframe of features. - y (pd.Series): Ignored. + X (ww.DataTable, pd.DataFrame): Features to one-hot encode. + y (ww.DataColumn, pd.Series): Ignored. Returns: - Transformed dataframe, where each categorical feature has been encoded into numerical columns using one-hot encoding. + ww.DataTable: Transformed data, where each categorical feature has been encoded into numerical columns using one-hot encoding. """ X_copy = _convert_to_woodwork_structure(X) X_copy = _convert_woodwork_types_wrapper(X_copy.to_dataframe()) @@ -151,8 +151,7 @@ def transform(self, X, y=None): X_cat.columns = self.get_feature_names() X_t = pd.concat([X_t, X_cat], axis=1) - X_t = _convert_to_woodwork_structure(X_t) - return X_t + return _convert_to_woodwork_structure(X_t) def _handle_parameter_handle_missing(self, X): """Helper method to handle the `handle_missing` parameter.""" diff --git a/evalml/pipelines/time_series_classification_pipelines.py b/evalml/pipelines/time_series_classification_pipelines.py index 971f4dab3b..33b7f2823a 100644 --- a/evalml/pipelines/time_series_classification_pipelines.py +++ b/evalml/pipelines/time_series_classification_pipelines.py @@ -89,14 +89,9 @@ def _estimator_predict_proba(self, features, y): def _predict(self, X, y, objective=None, pad=False): features = self.compute_estimator_features(X, y) - if isinstance(features, ww.DataTable): - features = _convert_woodwork_types_wrapper(features.to_dataframe()) - elif isinstance(features, ww.DataColumn): - features = _convert_woodwork_types_wrapper(features.to_series()) - + features = _convert_woodwork_types_wrapper(features.to_dataframe()) features_no_nan, y_no_nan = drop_rows_with_nans(features, y) predictions = self._estimator_predict(features_no_nan, y_no_nan) - if pad: padded = pad_with_nans(predictions.to_series(), max(0, features.shape[0] - predictions.shape[0])) return _convert_to_woodwork_structure(padded) @@ -118,14 +113,10 @@ def predict(self, X, y=None, objective=None): y = _convert_woodwork_types_wrapper(y.to_series()) n_features = max(len(y), X.shape[0]) predictions = self._predict(X, y, objective=objective, pad=False) - if isinstance(predictions, ww.DataTable): - predictions = _convert_woodwork_types_wrapper(predictions.to_dataframe()) - elif isinstance(predictions, ww.DataColumn): - predictions = _convert_woodwork_types_wrapper(predictions.to_series()) + predictions = _convert_woodwork_types_wrapper(predictions.to_series()) # In case gap is 0 and this is a baseline pipeline, we drop the nans in the # predictions before decoding them predictions = 
pd.Series(self._decode_targets(predictions.dropna()), name=self.input_target_name) - padded = pad_with_nans(predictions, max(0, n_features - predictions.shape[0])) return _convert_to_woodwork_structure(padded) @@ -142,10 +133,7 @@ def predict_proba(self, X, y=None): X = _convert_woodwork_types_wrapper(X.to_dataframe()) y = _convert_woodwork_types_wrapper(y.to_series()) features = self.compute_estimator_features(X, y) - if isinstance(features, ww.DataTable): - features = _convert_woodwork_types_wrapper(features.to_dataframe()) - elif isinstance(features, ww.DataColumn): - features = _convert_woodwork_types_wrapper(features.to_series()) + features = _convert_woodwork_types_wrapper(features.to_dataframe()) features_no_nan, y_no_nan = drop_rows_with_nans(features, y) proba = self._estimator_predict_proba(features_no_nan, y_no_nan).to_dataframe() proba.columns = self._encoder.classes_ @@ -207,11 +195,7 @@ def threshold(self, value): def _predict(self, X, y, objective=None, pad=False): features = self.compute_estimator_features(X, y) - if isinstance(features, ww.DataTable): - features = _convert_woodwork_types_wrapper(features.to_dataframe()) - elif isinstance(features, ww.DataColumn): - features = _convert_woodwork_types_wrapper(features.to_series()) - + features = _convert_woodwork_types_wrapper(features.to_dataframe()) features_no_nan, y_no_nan = drop_rows_with_nans(features, y) if objective is not None: @@ -229,8 +213,7 @@ def _predict(self, X, y, objective=None, pad=False): else: predictions = objective.decision_function(proba, threshold=self.threshold, X=features_no_nan) if pad: - padded = pad_with_nans(predictions, max(0, features.shape[0] - predictions.shape[0])) - return _convert_to_woodwork_structure(padded) + predictions = pad_with_nans(predictions, max(0, features.shape[0] - predictions.shape[0])) return _convert_to_woodwork_structure(predictions) @staticmethod From 96505ecdcd7f6572398675bb463f192110771599 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 14:51:54 -0500 Subject: [PATCH 74/98] more cleanup --- .../components/estimators/estimator.py | 4 ++-- .../transformers/encoders/target_encoder.py | 2 +- .../feature_selection/feature_selector.py | 7 ++----- .../components/transformers/imputers/imputer.py | 5 ++--- .../transformers/imputers/per_column_imputer.py | 17 +---------------- .../transformers/imputers/simple_imputer.py | 3 +-- .../preprocessing/text_featurizer.py | 3 +-- .../transformers/scalers/standard_scaler.py | 4 +--- .../components/transformers/transformer.py | 7 ++----- .../time_series_regression_pipeline.py | 9 ++------- 10 files changed, 15 insertions(+), 46 deletions(-) diff --git a/evalml/pipelines/components/estimators/estimator.py b/evalml/pipelines/components/estimators/estimator.py index cfaf35a98d..fcb78041bc 100644 --- a/evalml/pipelines/components/estimators/estimator.py +++ b/evalml/pipelines/components/estimators/estimator.py @@ -37,7 +37,7 @@ def predict(self, X): X (ww.DataTable, pd.DataFrame, or np.ndarray): Data of shape [n_samples, n_features] Returns: - pd.Series: Predicted values + ww.DataColumn: Predicted values """ try: X = _convert_to_woodwork_structure(X) @@ -54,7 +54,7 @@ def predict_proba(self, X): X (ww.DataTable, pd.DataFrame, or np.ndarray): Features Returns: - pd.DataFrame: Probability estimates + ww.DataTable: Probability estimates """ try: X = _convert_to_woodwork_structure(X) diff --git a/evalml/pipelines/components/transformers/encoders/target_encoder.py 
b/evalml/pipelines/components/transformers/encoders/target_encoder.py index e7bbbe10f2..1e28a1bcfe 100644 --- a/evalml/pipelines/components/transformers/encoders/target_encoder.py +++ b/evalml/pipelines/components/transformers/encoders/target_encoder.py @@ -52,7 +52,7 @@ def __init__(self, random_state=random_state) def fit(self, X, y): - # do we want to do this? + # TODO do we want to do this? if isinstance(X, pd.DataFrame): X.reset_index(drop=True, inplace=True) if isinstance(y, pd.Series): diff --git a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py index 7690ee097a..bb4a61c268 100644 --- a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py +++ b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py @@ -23,8 +23,8 @@ def transform(self, X, y=None): """Transforms input data by selecting features. Arguments: - X (pd.DataFrame): Data to transform - y (pd.Series, optional): Target data + X (ww.DataTable, pd.DataFrame): Data to transform + y (ww.DataColumn, pd.Series, optional): Target data. Ignored. Returns: ww.DataTable: Transformed X @@ -43,6 +43,3 @@ def transform(self, X, y=None): col_types = {key: X_dtypes[key] for key in selected_col_names} features = pd.DataFrame(X_t, columns=selected_col_names, index=X.index).astype(col_types) return _convert_to_woodwork_structure(features) - - def fit_transform(self, X, y=None): - return self.fit(X, y).transform(X, y) diff --git a/evalml/pipelines/components/transformers/imputers/imputer.py b/evalml/pipelines/components/transformers/imputers/imputer.py index ddcdcdfdaa..a80cf67bba 100644 --- a/evalml/pipelines/components/transformers/imputers/imputer.py +++ b/evalml/pipelines/components/transformers/imputers/imputer.py @@ -101,8 +101,7 @@ def transform(self, X, y=None): X_null_dropped = X.copy() X_null_dropped.drop(self._all_null_cols, inplace=True, axis=1, errors='ignore') if X_null_dropped.empty: - X_null_dropped = _convert_to_woodwork_structure(X_null_dropped) - return X_null_dropped + return _convert_to_woodwork_structure(X_null_dropped) if self._numeric_cols is not None and len(self._numeric_cols) > 0: X_numeric = X_null_dropped[self._numeric_cols] @@ -113,6 +112,6 @@ def transform(self, X, y=None): X_categorical = X_null_dropped[self._categorical_cols] imputed = self._categorical_imputer.transform(X_categorical).to_dataframe() X_null_dropped[X_categorical.columns] = imputed - X_null_dropped = _convert_to_woodwork_structure(X_null_dropped) + X_null_dropped = _convert_to_woodwork_structure(X_null_dropped) return X_null_dropped diff --git a/evalml/pipelines/components/transformers/imputers/per_column_imputer.py b/evalml/pipelines/components/transformers/imputers/per_column_imputer.py index e5508ee433..f8782c1c41 100644 --- a/evalml/pipelines/components/transformers/imputers/per_column_imputer.py +++ b/evalml/pipelines/components/transformers/imputers/per_column_imputer.py @@ -86,19 +86,4 @@ def transform(self, X, y=None): else: X_t[column] = transformed[column] X_t = X_t.drop(cols_to_drop, axis=1) - X_t = _convert_to_woodwork_structure(X_t) - return X_t - - def fit_transform(self, X, y=None): - """Fits imputer and imputes missing values in input data. - - Arguments: - X (ww.DataTable, pd.DataFrame or np.ndarray): The input training data of shape [n_samples, n_features] to transform. - y (ww.DataColumn, pd.Series, optional): The target training data of length [n_samples]. Ignored. 
- - Returns: - ww.DataTable: Transformed X - """ - - self.fit(X, y) - return self.transform(X, y) + return _convert_to_woodwork_structure(X_t) diff --git a/evalml/pipelines/components/transformers/imputers/simple_imputer.py b/evalml/pipelines/components/transformers/imputers/simple_imputer.py index 71f8ed2b6f..9e4a6ab973 100644 --- a/evalml/pipelines/components/transformers/imputers/simple_imputer.py +++ b/evalml/pipelines/components/transformers/imputers/simple_imputer.py @@ -56,8 +56,7 @@ def fit(self, X, y=None): return self def transform(self, X, y=None): - """Transforms data X by imputing missing values. 'None' values are converted to np.nan before imputation and are - treated as the same. + """Transforms input by imputing missing values. 'None' and np.nan values are treated as the same. Arguments: X (ww.DataTable, pd.DataFrame): Data to transform diff --git a/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py b/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py index 1c99bf9a23..894350fc74 100644 --- a/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py +++ b/evalml/pipelines/components/transformers/preprocessing/text_featurizer.py @@ -108,5 +108,4 @@ def transform(self, X, y=None): X_lsa = self._lsa.transform(X[text_columns]).to_dataframe() X_nlp_primitives.set_index(X.index, inplace=True) X_t = pd.concat([X.drop(text_columns, axis=1), X_nlp_primitives, X_lsa], axis=1) - X_t = _convert_to_woodwork_structure(X_t) - return X_t + return _convert_to_woodwork_structure(X_t) diff --git a/evalml/pipelines/components/transformers/scalers/standard_scaler.py b/evalml/pipelines/components/transformers/scalers/standard_scaler.py index b4f1a364dd..3eee1a9d0b 100644 --- a/evalml/pipelines/components/transformers/scalers/standard_scaler.py +++ b/evalml/pipelines/components/transformers/scalers/standard_scaler.py @@ -26,10 +26,8 @@ def transform(self, X, y=None): X = _convert_to_woodwork_structure(X) X = _convert_woodwork_types_wrapper(X.to_dataframe()) - X_cols = X.columns - X_index = X.index X_t = self._component_obj.transform(X) - X_t_df = pd.DataFrame(X_t, columns=X_cols, index=X_index) + X_t_df = pd.DataFrame(X_t, columns=X.columns, index=X.index) return _convert_to_woodwork_structure(X_t_df) def fit_transform(self, X, y=None): diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index ff4b403bf4..3a1959b3cb 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -40,15 +40,12 @@ def transform(self, X, y=None): if y is not None: y = _convert_to_woodwork_structure(y) y = _convert_woodwork_types_wrapper(y.to_series()) - X_cols = X.columns - X_index = X.index # category treated differently from object... 
X_t = self._component_obj.transform(X, y) except AttributeError: raise MethodPropertyNotFoundError("Transformer requires a transform method or a component_obj that implements transform") - # if isinstance(X, pd.DataFrame): - # return _convert_to_woodwork_structure(pd.DataFrame(X_t, columns=X.columns, index=X.index)) - X_t_df = pd.DataFrame(X_t, columns=X_cols, index=X_index) + + X_t_df = pd.DataFrame(X_t, columns=X.columns, index=X.index) return _convert_to_woodwork_structure(X_t_df) def fit_transform(self, X, y=None): diff --git a/evalml/pipelines/time_series_regression_pipeline.py b/evalml/pipelines/time_series_regression_pipeline.py index ba1e2fd77f..a8e8ef1fbf 100644 --- a/evalml/pipelines/time_series_regression_pipeline.py +++ b/evalml/pipelines/time_series_regression_pipeline.py @@ -81,17 +81,12 @@ def predict(self, X, y=None, objective=None): X = _convert_woodwork_types_wrapper(X.to_dataframe()) y = _convert_woodwork_types_wrapper(y.to_series()) features = self.compute_estimator_features(X, y) - if isinstance(features, ww.DataTable): - features = _convert_woodwork_types_wrapper(features.to_dataframe()) - elif isinstance(features, ww.DataColumn): - features = _convert_woodwork_types_wrapper(features.to_series()) - + features = _convert_woodwork_types_wrapper(features.to_dataframe()) features_no_nan, y = drop_rows_with_nans(features, y) y_arg = None if self.estimator.predict_uses_y: y_arg = y - predictions = self.estimator.predict(features_no_nan, y_arg) - predictions = predictions.to_series() + predictions = self.estimator.predict(features_no_nan, y_arg).to_series() predictions = predictions.rename(self.input_target_name) padded = pad_with_nans(predictions, max(0, features.shape[0] - predictions.shape[0])) return _convert_to_woodwork_structure(padded) From 17ed8bef8898a61c42cd262de2897d251be6d9f2 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 14:57:48 -0500 Subject: [PATCH 75/98] some cleanup of unnecessary code in standard scaler --- .../transformers/scalers/standard_scaler.py | 38 +++++++++---------- .../components/transformers/transformer.py | 10 ++--- .../time_series_classification_pipelines.py | 6 +-- 3 files changed, 27 insertions(+), 27 deletions(-) diff --git a/evalml/pipelines/components/transformers/scalers/standard_scaler.py b/evalml/pipelines/components/transformers/scalers/standard_scaler.py index 3eee1a9d0b..226747632d 100644 --- a/evalml/pipelines/components/transformers/scalers/standard_scaler.py +++ b/evalml/pipelines/components/transformers/scalers/standard_scaler.py @@ -22,22 +22,22 @@ def __init__(self, random_state=0, **kwargs): component_obj=scaler, random_state=random_state) - def transform(self, X, y=None): - - X = _convert_to_woodwork_structure(X) - X = _convert_woodwork_types_wrapper(X.to_dataframe()) - X_t = self._component_obj.transform(X) - X_t_df = pd.DataFrame(X_t, columns=X.columns, index=X.index) - return _convert_to_woodwork_structure(X_t_df) - - def fit_transform(self, X, y=None): - return self.fit(X, y).transform(X, y) - - def fit(self, X, y=None): - X = _convert_to_woodwork_structure(X) - X = _convert_woodwork_types_wrapper(X.to_dataframe()) - if y is not None: - y = _convert_to_woodwork_structure(y) - y = _convert_woodwork_types_wrapper(y.to_series()) - self._component_obj.fit(X, y) - return self + # def transform(self, X, y=None): + + # X = _convert_to_woodwork_structure(X) + # X = _convert_woodwork_types_wrapper(X.to_dataframe()) + # X_t = self._component_obj.transform(X) + # X_t_df = pd.DataFrame(X_t, columns=X.columns, 
index=X.index) + # return _convert_to_woodwork_structure(X_t_df) + + # def fit_transform(self, X, y=None): + # return self.fit(X, y).transform(X, y) + + # def fit(self, X, y=None): + # X = _convert_to_woodwork_structure(X) + # X = _convert_woodwork_types_wrapper(X.to_dataframe()) + # if y is not None: + # y = _convert_to_woodwork_structure(y) + # y = _convert_woodwork_types_wrapper(y.to_series()) + # self._component_obj.fit(X, y) + # return self diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index 3a1959b3cb..3df1a5bc0d 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -59,11 +59,11 @@ def fit_transform(self, X, y=None): ww.DataTable: Transformed X """ try: - X2 = _convert_to_woodwork_structure(X) - y2 = _convert_to_woodwork_structure(y) - X2 = _convert_woodwork_types_wrapper(X2.to_dataframe()) - y2 = _convert_woodwork_types_wrapper(y2.to_series()) - X_t = self._component_obj.fit_transform(X2, y2) + X = _convert_to_woodwork_structure(X) + y = _convert_to_woodwork_structure(y) + X = _convert_woodwork_types_wrapper(X.to_dataframe()) + y = _convert_woodwork_types_wrapper(y.to_series()) + X_t = self._component_obj.fit_transform(X, y) except AttributeError: try: self.fit(X, y) diff --git a/evalml/pipelines/time_series_classification_pipelines.py b/evalml/pipelines/time_series_classification_pipelines.py index 33b7f2823a..ec4f5622ff 100644 --- a/evalml/pipelines/time_series_classification_pipelines.py +++ b/evalml/pipelines/time_series_classification_pipelines.py @@ -149,11 +149,11 @@ def _compute_predictions(self, X, y, objectives): if any(not o.score_needs_proba for o in objectives): y_predicted = self._predict(X, y, pad=True) - if isinstance(y_predicted_proba, ww.DataTable): + if y_predicted_proba is not None: y_predicted_proba = _convert_woodwork_types_wrapper(y_predicted_proba.to_dataframe()) - - if isinstance(y_predicted, ww.DataColumn): + if y_predicted is not None: y_predicted = _convert_woodwork_types_wrapper(y_predicted.to_series()) + return y_predicted, y_predicted_proba def score(self, X, y, objectives): From 11645724664765a5b540e517ed6057197d1fcc16 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 15:00:41 -0500 Subject: [PATCH 76/98] make classification and time series classification predict same --- evalml/pipelines/classification_pipeline.py | 10 ++++------ .../time_series_classification_pipelines.py | 18 ++++++++---------- 2 files changed, 12 insertions(+), 16 deletions(-) diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index 75ae946aa3..b17f4de0ef 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -126,7 +126,6 @@ def score(self, X, y, objectives): y_predicted, y_predicted_proba = self._compute_predictions(X, objectives) if y_predicted is not None: y_predicted = _convert_woodwork_types_wrapper(y_predicted.to_series()) - if y_predicted_proba is not None: y_predicted_proba = _convert_woodwork_types_wrapper(y_predicted_proba.to_dataframe()) return self._score_all_objectives(X, y, y_predicted, y_predicted_proba, objectives) @@ -135,9 +134,8 @@ def _compute_predictions(self, X, objectives): """Helper function to scan through the objectives list and precompute probabilities.""" y_predicted = None y_predicted_proba = None - for objective in objectives: - if objective.score_needs_proba and 
y_predicted_proba is None: - y_predicted_proba = self.predict_proba(X) - if not objective.score_needs_proba and y_predicted is None: - y_predicted = self._predict(X) + if any(o.score_needs_proba for o in objectives): + y_predicted_proba = self.predict_proba(X) + if any(not o.score_needs_proba for o in objectives): + y_predicted = self._predict(X) return y_predicted, y_predicted_proba diff --git a/evalml/pipelines/time_series_classification_pipelines.py b/evalml/pipelines/time_series_classification_pipelines.py index ec4f5622ff..ec14409687 100644 --- a/evalml/pipelines/time_series_classification_pipelines.py +++ b/evalml/pipelines/time_series_classification_pipelines.py @@ -148,12 +148,6 @@ def _compute_predictions(self, X, y, objectives): y_predicted_proba = self.predict_proba(X, y) if any(not o.score_needs_proba for o in objectives): y_predicted = self._predict(X, y, pad=True) - - if y_predicted_proba is not None: - y_predicted_proba = _convert_woodwork_types_wrapper(y_predicted_proba.to_dataframe()) - if y_predicted is not None: - y_predicted = _convert_woodwork_types_wrapper(y_predicted.to_series()) - return y_predicted, y_predicted_proba def score(self, X, y, objectives): @@ -174,10 +168,14 @@ def score(self, X, y, objectives): y_encoded = self._encode_targets(y) y_shifted = y_encoded.shift(-self.gap) - y_pred, y_pred_proba = self._compute_predictions(X, y, objectives) - y_shifted, y_pred, y_pred_proba = drop_rows_with_nans(y_shifted, y_pred, y_pred_proba) - return self._score_all_objectives(X, y_shifted, y_pred, - y_pred_proba=y_pred_proba, + y_predicted, y_predicted_proba = self._compute_predictions(X, y, objectives) + if y_predicted is not None: + y_predicted = _convert_woodwork_types_wrapper(y_predicted.to_series()) + if y_predicted_proba is not None: + y_predicted_proba = _convert_woodwork_types_wrapper(y_predicted_proba.to_dataframe()) + y_shifted, y_predicted, y_predicted_proba = drop_rows_with_nans(y_shifted, y_predicted, y_predicted_proba) + return self._score_all_objectives(X, y_shifted, y_predicted, + y_pred_proba=y_predicted_proba, objectives=objectives) From f88392ddea9fe3323545ceffbbf89cfd88cf9a17 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 15:41:03 -0500 Subject: [PATCH 77/98] fix tests and more cleanup --- .../feature_selection/feature_selector.py | 3 ++ .../transformers/scalers/standard_scaler.py | 28 ++++++------------ .../components/transformers/transformer.py | 2 +- .../time_series_classification_pipelines.py | 2 -- .../time_series_regression_pipeline.py | 1 - .../test_baseline_classifier.py | 2 -- .../test_drop_null_columns_transformer.py | 2 +- evalml/tests/component_tests/test_imputer.py | 29 +++++++------------ .../component_tests/test_simple_imputer.py | 12 ++++---- .../test_multicollinearity_data_check.py | 6 ++-- .../model_understanding_tests/test_graphs.py | 9 ++---- .../test_time_series_pipeline.py | 10 ++++--- 12 files changed, 41 insertions(+), 65 deletions(-) diff --git a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py index bb4a61c268..e3086fdd1a 100644 --- a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py +++ b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py @@ -43,3 +43,6 @@ def transform(self, X, y=None): col_types = {key: X_dtypes[key] for key in selected_col_names} features = pd.DataFrame(X_t, columns=selected_col_names, index=X.index).astype(col_types) 
return _convert_to_woodwork_structure(features) + + def fit_transform(self, X, y=None): + return self.fit(X, y).transform(X, y) diff --git a/evalml/pipelines/components/transformers/scalers/standard_scaler.py b/evalml/pipelines/components/transformers/scalers/standard_scaler.py index 226747632d..6a6737babc 100644 --- a/evalml/pipelines/components/transformers/scalers/standard_scaler.py +++ b/evalml/pipelines/components/transformers/scalers/standard_scaler.py @@ -22,22 +22,12 @@ def __init__(self, random_state=0, **kwargs): component_obj=scaler, random_state=random_state) - # def transform(self, X, y=None): - - # X = _convert_to_woodwork_structure(X) - # X = _convert_woodwork_types_wrapper(X.to_dataframe()) - # X_t = self._component_obj.transform(X) - # X_t_df = pd.DataFrame(X_t, columns=X.columns, index=X.index) - # return _convert_to_woodwork_structure(X_t_df) - - # def fit_transform(self, X, y=None): - # return self.fit(X, y).transform(X, y) - - # def fit(self, X, y=None): - # X = _convert_to_woodwork_structure(X) - # X = _convert_woodwork_types_wrapper(X.to_dataframe()) - # if y is not None: - # y = _convert_to_woodwork_structure(y) - # y = _convert_woodwork_types_wrapper(y.to_series()) - # self._component_obj.fit(X, y) - # return self + def transform(self, X, y=None): + X = _convert_to_woodwork_structure(X) + X = _convert_woodwork_types_wrapper(X.to_dataframe()) + X_t = self._component_obj.transform(X) + X_t_df = pd.DataFrame(X_t, columns=X.columns, index=X.index) + return _convert_to_woodwork_structure(X_t_df) + + def fit_transform(self, X, y=None): + return self.fit(X, y).transform(X, y) diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index 3df1a5bc0d..4babb2388a 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -41,7 +41,7 @@ def transform(self, X, y=None): y = _convert_to_woodwork_structure(y) y = _convert_woodwork_types_wrapper(y.to_series()) # category treated differently from object... 
- X_t = self._component_obj.transform(X, y) + X_t = self._component_obj.transform(X, y) except AttributeError: raise MethodPropertyNotFoundError("Transformer requires a transform method or a component_obj that implements transform") diff --git a/evalml/pipelines/time_series_classification_pipelines.py b/evalml/pipelines/time_series_classification_pipelines.py index ec14409687..45aae8211a 100644 --- a/evalml/pipelines/time_series_classification_pipelines.py +++ b/evalml/pipelines/time_series_classification_pipelines.py @@ -1,5 +1,4 @@ import pandas as pd -import woodwork as ww from evalml.objectives import get_objective from evalml.pipelines.classification_pipeline import ClassificationPipeline @@ -84,7 +83,6 @@ def _estimator_predict_proba(self, features, y): y_arg = None if self.estimator.predict_uses_y: y_arg = y - return self.estimator.predict_proba(features, y=y_arg) def _predict(self, X, y, objective=None, pad=False): diff --git a/evalml/pipelines/time_series_regression_pipeline.py b/evalml/pipelines/time_series_regression_pipeline.py index a8e8ef1fbf..7cfc4a13b5 100644 --- a/evalml/pipelines/time_series_regression_pipeline.py +++ b/evalml/pipelines/time_series_regression_pipeline.py @@ -1,5 +1,4 @@ import pandas as pd -import woodwork as ww from evalml.objectives import get_objective from evalml.pipelines.regression_pipeline import RegressionPipeline diff --git a/evalml/tests/component_tests/test_baseline_classifier.py b/evalml/tests/component_tests/test_baseline_classifier.py index c2bfe60a56..ceca215d0c 100644 --- a/evalml/tests/component_tests/test_baseline_classifier.py +++ b/evalml/tests/component_tests/test_baseline_classifier.py @@ -114,7 +114,6 @@ def test_baseline_multiclass_random(X_y_multi): predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) assert_frame_equal(pd.DataFrame(np.array([[1. 
/ 3 for i in range(len(values))]] * len(X))), predicted_proba.to_dataframe()) - # np.testing.assert_allclose(predicted_proba, ) np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -130,7 +129,6 @@ def test_baseline_multiclass_random_weighted(X_y_multi): predictions = clf.predict(X) assert_series_equal(pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64"), predictions.to_series()) - # np.testing.assert_allclose(clf.predict(X), get_random_state(0).choice(np.unique(y), len(X), p=percent_freq)) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) assert_frame_equal(pd.DataFrame(np.array([[percent_freq[i] for i in range(len(values))]] * len(X))), predicted_proba.to_dataframe()) diff --git a/evalml/tests/component_tests/test_drop_null_columns_transformer.py b/evalml/tests/component_tests/test_drop_null_columns_transformer.py index 2fe1cba719..763968a5e0 100644 --- a/evalml/tests/component_tests/test_drop_null_columns_transformer.py +++ b/evalml/tests/component_tests/test_drop_null_columns_transformer.py @@ -104,7 +104,7 @@ def test_drop_null_transformer_fit_transform(): 'some_null': [None, 0, 3, 4, 5]}) drop_null_transformer = DropNullColumns(pct_null_threshold=1.0) X_t = drop_null_transformer.fit_transform(X) - assert_frame_equal(X_t.to_dataframe(), X.drop(["all_null"], axis=1)) + assert_frame_equal(X.drop(["all_null"], axis=1), X_t.to_dataframe()) def test_drop_null_transformer_np_array(): diff --git a/evalml/tests/component_tests/test_imputer.py b/evalml/tests/component_tests/test_imputer.py index e2df993bdd..d295d45e0d 100644 --- a/evalml/tests/component_tests/test_imputer.py +++ b/evalml/tests/component_tests/test_imputer.py @@ -1,7 +1,6 @@ import numpy as np import pandas as pd import pytest -import woodwork as ww from pandas.testing import assert_frame_equal from evalml.pipelines.components import Imputer @@ -183,19 +182,12 @@ def test_imputer_datetime_input(): @pytest.mark.parametrize("data_type", ['np', 'pd', 'ww']) -def test_imputer_empty_data(data_type): - if data_type == 'pd': - X = pd.DataFrame() - y = pd.Series() - expected = pd.DataFrame(index=pd.Index([]), columns=pd.Index([])) - elif data_type == 'ww': - X = ww.DataTable(pd.DataFrame()) - y = ww.DataColumn(pd.Series()) - expected = pd.DataFrame(index=pd.Index([]), columns=pd.Index([])) - else: - X = np.array([[]]) - y = np.array([]) - expected = pd.DataFrame(index=pd.Index([0]), columns=pd.Int64Index([])) +def test_imputer_empty_data(data_type, make_data_type): + X = pd.DataFrame() + y = pd.Series() + X = make_data_type(data_type, X) + y = make_data_type(data_type, y) + expected = pd.DataFrame(index=pd.Index([]), columns=pd.Index([])) imputer = Imputer() imputer.fit(X, y) transformed = imputer.transform(X, y) @@ -317,7 +309,7 @@ def test_imputer_bool_dtype_object(data_type, make_data_type): @pytest.mark.parametrize("data_type", ['pd', 'ww']) -def test_imputer_multitype_with_one_bool(data_type): +def test_imputer_multitype_with_one_bool(data_type, make_data_type): X_multi = pd.DataFrame({ "bool with nan": pd.Series([True, np.nan, False, np.nan, False], dtype=object), "bool no nan": pd.Series([False, False, False, False, True], dtype=bool), @@ -327,9 +319,10 @@ def test_imputer_multitype_with_one_bool(data_type): "bool with nan": pd.Series([True, False, False, False, False], dtype='boolean'), "bool no nan": pd.Series([False, False, False, False, True], dtype='boolean'), }) - if data_type == 'ww': - X_multi = ww.DataTable(X_multi) - y 
= ww.DataColumn(y) + + X_multi = make_data_type(data_type, X_multi) + y = make_data_type(data_type, y) + imputer = Imputer() imputer.fit(X_multi, y) X_multi_t = imputer.transform(X_multi) diff --git a/evalml/tests/component_tests/test_simple_imputer.py b/evalml/tests/component_tests/test_simple_imputer.py index 1ac31cefdf..bb8395dd12 100644 --- a/evalml/tests/component_tests/test_simple_imputer.py +++ b/evalml/tests/component_tests/test_simple_imputer.py @@ -1,7 +1,6 @@ import numpy as np import pandas as pd import pytest -import woodwork as ww from pandas.testing import assert_frame_equal from evalml.pipelines.components import SimpleImputer @@ -117,12 +116,11 @@ def test_simple_imputer_all_bool_return_original(data_type, make_data_type): @pytest.mark.parametrize("data_type", ['pd', 'ww']) -def test_simple_imputer_bool_dtype_object(data_type): +def test_simple_imputer_bool_dtype_object(data_type, make_data_type): X = pd.DataFrame([True, np.nan, False, np.nan, True], dtype=object) y = pd.Series([1, 0, 0, 1, 0]) X_expected_arr = pd.DataFrame([True, True, False, True, True], dtype='boolean') - if data_type == 'ww': - X = ww.DataTable(X) + X = make_data_type(data_type, X) imputer = SimpleImputer() imputer.fit(X, y) X_t = imputer.transform(X) @@ -130,7 +128,7 @@ def test_simple_imputer_bool_dtype_object(data_type): @pytest.mark.parametrize("data_type", ['pd', 'ww']) -def test_simple_imputer_multitype_with_one_bool(data_type): +def test_simple_imputer_multitype_with_one_bool(data_type, make_data_type): X_multi = pd.DataFrame({ "bool with nan": pd.Series([True, np.nan, False, np.nan, False], dtype=object), "bool no nan": pd.Series([False, False, False, False, True], dtype=bool), @@ -140,8 +138,8 @@ def test_simple_imputer_multitype_with_one_bool(data_type): "bool with nan": pd.Series([True, False, False, False, False], dtype='boolean'), "bool no nan": pd.Series([False, False, False, False, True], dtype='boolean'), }) - if data_type == 'ww': - X_multi = ww.DataTable(X_multi) + X_multi = make_data_type(data_type, X_multi) + imputer = SimpleImputer() imputer.fit(X_multi, y) X_multi_t = imputer.transform(X_multi) diff --git a/evalml/tests/data_checks_tests/test_multicollinearity_data_check.py b/evalml/tests/data_checks_tests/test_multicollinearity_data_check.py index 126a828a78..29097619dd 100644 --- a/evalml/tests/data_checks_tests/test_multicollinearity_data_check.py +++ b/evalml/tests/data_checks_tests/test_multicollinearity_data_check.py @@ -1,6 +1,5 @@ import pandas as pd import pytest -import woodwork as ww from evalml.data_checks import ( DataCheckMessageCode, @@ -52,7 +51,7 @@ def test_multicollinearity_returns_warning(): @pytest.mark.parametrize("data_type", ['pd', 'ww']) -def test_multicollinearity_nonnumeric_cols(data_type): +def test_multicollinearity_nonnumeric_cols(data_type, make_data_type): X = pd.DataFrame({'col_1': ["a", "b", "c", "d", "a"], 'col_2': ["w", "x", "y", "z", "b"], 'col_3': ["a", "a", "c", "d", "a"], @@ -60,8 +59,7 @@ def test_multicollinearity_nonnumeric_cols(data_type): 'col_5': ["0", "0", "1", "2", "0"], 'col_6': [1, 1, 2, 3, 1] }) - if data_type == 'ww': - X = ww.DataTable(X) + X = make_data_type(data_type, X) multi_check = MulticollinearityDataCheck(threshold=0.9) assert multi_check.validate(X) == { "warnings": [DataCheckWarning(message="Columns are likely to be correlated: [('col_1', 'col_4'), ('col_3', 'col_5'), ('col_3', 'col_6'), ('col_5', 'col_6'), ('col_1', 'col_2'), ('col_2', 'col_4')]", diff --git a/evalml/tests/model_understanding_tests/test_graphs.py 
b/evalml/tests/model_understanding_tests/test_graphs.py index 3d867efd39..408f9a17f2 100644 --- a/evalml/tests/model_understanding_tests/test_graphs.py +++ b/evalml/tests/model_understanding_tests/test_graphs.py @@ -298,12 +298,8 @@ def test_roc_curve_binary(data_type, make_data_type): y_true = np.array([1, 1, 0, 0]) y_predict_proba = np.array([[0.9, 0.1], [0.6, 0.4], [0.65, 0.35], [0.2, 0.8]]) - if data_type != 'np': - y_true = pd.Series(y_true) - y_predict_proba = pd.DataFrame(y_predict_proba) - if data_type == 'ww': - y_true = ww.DataColumn(y_true) - y_predict_proba = ww.DataTable(y_predict_proba) + y_predict_proba = make_data_type(data_type, y_predict_proba) + y_true = make_data_type(data_type, y_true) roc_curve_data = roc_curve(y_true, y_predict_proba)[0] fpr_rates = roc_curve_data.get('fpr_rates') @@ -349,6 +345,7 @@ def test_roc_curve_multiclass(data_type, make_data_type): y_true_unique = y_true if data_type == 'ww': y_true_unique = y_true.to_series() + for i in np.unique(y_true_unique): fpr_rates = roc_curve_data[i].get('fpr_rates') tpr_rates = roc_curve_data[i].get('tpr_rates') diff --git a/evalml/tests/pipeline_tests/test_time_series_pipeline.py b/evalml/tests/pipeline_tests/test_time_series_pipeline.py index 69d077f72d..512009f61c 100644 --- a/evalml/tests/pipeline_tests/test_time_series_pipeline.py +++ b/evalml/tests/pipeline_tests/test_time_series_pipeline.py @@ -4,6 +4,7 @@ import pandas as pd import pytest import woodwork as ww +from pandas.testing import assert_frame_equal, assert_series_equal from evalml.pipelines import ( TimeSeriesBinaryClassificationPipeline, @@ -232,21 +233,22 @@ class MyTsPipeline(pipeline_class): df_passed_to_estimator, target_passed_to_estimator = mock_fit.call_args[0] # Check the features have target values encoded as ints. - pd.testing.assert_frame_equal(df_passed_to_estimator, answer) + assert_frame_equal(df_passed_to_estimator, answer) # Check that target is converted to ints. 
Use .iloc[1:] because the first feature row has NaNs - pd.testing.assert_series_equal(target_passed_to_estimator, y_series.iloc[1:]) + assert_series_equal(target_passed_to_estimator, y_series.iloc[1:]) pl.predict(X, y_encoded) # Best way to get the argument since the api changes between 3.6/3.7 and 3.8 df_passed_to_predict = mock_predict.call_args[0][0] - pd.testing.assert_frame_equal(df_passed_to_predict, answer) + assert_frame_equal(df_passed_to_predict, answer) mock_predict.reset_mock() + # Since we mock score_all_objectives, the objective doesn't matter pl.score(X, y_encoded, objectives=['MCC Binary']) df_passed_to_predict = mock_predict.call_args[0][0] - pd.testing.assert_frame_equal(df_passed_to_predict, answer) + assert_frame_equal(df_passed_to_predict, answer) @pytest.mark.parametrize("pipeline_class,objectives", [(TimeSeriesBinaryClassificationPipeline, ["MCC Binary"]), From 8ec9d01d604757440eb3cc21e731600bc5a481a9 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 15:53:51 -0500 Subject: [PATCH 78/98] oops fix test --- evalml/pipelines/components/transformers/transformer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index 4babb2388a..3df1a5bc0d 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -41,7 +41,7 @@ def transform(self, X, y=None): y = _convert_to_woodwork_structure(y) y = _convert_woodwork_types_wrapper(y.to_series()) # category treated differently from object... - X_t = self._component_obj.transform(X, y) + X_t = self._component_obj.transform(X, y) except AttributeError: raise MethodPropertyNotFoundError("Transformer requires a transform method or a component_obj that implements transform") From 7a4aae5046c2331cab3c328a39f6def47ad13824 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 16:48:21 -0500 Subject: [PATCH 79/98] oops fix imputer --- .../components/transformers/imputers/imputer.py | 3 +++ evalml/tests/pipeline_tests/test_component_graph.py | 12 ++++++------ 2 files changed, 9 insertions(+), 6 deletions(-) diff --git a/evalml/pipelines/components/transformers/imputers/imputer.py b/evalml/pipelines/components/transformers/imputers/imputer.py index a80cf67bba..c49973c8e2 100644 --- a/evalml/pipelines/components/transformers/imputers/imputer.py +++ b/evalml/pipelines/components/transformers/imputers/imputer.py @@ -115,3 +115,6 @@ def transform(self, X, y=None): X_null_dropped = _convert_to_woodwork_structure(X_null_dropped) return X_null_dropped + + def fit_transform(self, X, y=None): + return self.fit(X, y).transform(X, y) diff --git a/evalml/tests/pipeline_tests/test_component_graph.py b/evalml/tests/pipeline_tests/test_component_graph.py index efeb7fd61f..a4ce971e5b 100644 --- a/evalml/tests/pipeline_tests/test_component_graph.py +++ b/evalml/tests/pipeline_tests/test_component_graph.py @@ -356,8 +356,8 @@ def test_fit(mock_predict, mock_fit, mock_fit_transform, example_graph, X_y_bina @patch('evalml.pipelines.components.Imputer.fit_transform') -@patch('evalml.pipelines.components.OneHotEncoder.transform') -def test_fit_correct_inputs(mock_ohe_transform, mock_imputer_fit_transform, X_y_binary): +@patch('evalml.pipelines.components.OneHotEncoder.fit_transform') +def test_fit_correct_inputs(mock_ohe_fit_transform, mock_imputer_fit_transform, X_y_binary): X, y = X_y_binary X = pd.DataFrame(X) y = pd.Series(y) @@ -365,12 
+365,12 @@ def test_fit_correct_inputs(mock_ohe_transform, mock_imputer_fit_transform, X_y_ expected_x = ww.DataTable(pd.DataFrame(index=X.index, columns=X.index).fillna(1)) expected_y = ww.DataColumn(pd.Series(index=y.index).fillna(0)) mock_imputer_fit_transform.return_value = tuple((expected_x, expected_y)) - mock_ohe_transform.return_value = expected_x + mock_ohe_fit_transform.return_value = expected_x component_graph = ComponentGraph(graph).instantiate({}) component_graph.fit(X, y) - - assert_frame_equal(expected_x.to_dataframe(), mock_ohe_transform.call_args[0][0].to_dataframe()) - assert_series_equal(expected_y.to_series(), mock_ohe_transform.call_args[0][1].to_series()) + expected_x_df = expected_x.to_dataframe().astype("Int64") + assert_frame_equal(expected_x_df, mock_ohe_fit_transform.call_args[0][0].to_dataframe()) + assert_series_equal(expected_y.to_series(), mock_ohe_fit_transform.call_args[0][1].to_series()) @patch('evalml.pipelines.components.Transformer.fit_transform') From 37594b34650e97a89b28ea293f83d543a169c91e Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 17:22:19 -0500 Subject: [PATCH 80/98] actually fixing tests --- .../components/transformers/imputers/imputer.py | 4 ++-- evalml/pipelines/components/transformers/transformer.py | 9 ++++----- evalml/tests/pipeline_tests/test_component_graph.py | 7 +++---- 3 files changed, 9 insertions(+), 11 deletions(-) diff --git a/evalml/pipelines/components/transformers/imputers/imputer.py b/evalml/pipelines/components/transformers/imputers/imputer.py index c49973c8e2..ccd33a3d28 100644 --- a/evalml/pipelines/components/transformers/imputers/imputer.py +++ b/evalml/pipelines/components/transformers/imputers/imputer.py @@ -116,5 +116,5 @@ def transform(self, X, y=None): X_null_dropped = _convert_to_woodwork_structure(X_null_dropped) return X_null_dropped - def fit_transform(self, X, y=None): - return self.fit(X, y).transform(X, y) + # def fit_transform(self, X, y=None): + # return self.fit(X, y).transform(X, y) diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index 3df1a5bc0d..3da96b0a32 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -61,13 +61,12 @@ def fit_transform(self, X, y=None): try: X = _convert_to_woodwork_structure(X) y = _convert_to_woodwork_structure(y) - X = _convert_woodwork_types_wrapper(X.to_dataframe()) - y = _convert_woodwork_types_wrapper(y.to_series()) - X_t = self._component_obj.fit_transform(X, y) + X_pd = _convert_woodwork_types_wrapper(X.to_dataframe()) + y_pd = _convert_woodwork_types_wrapper(y.to_series()) + X_t = self._component_obj.fit_transform(X_pd, y_pd) except AttributeError: try: - self.fit(X, y) - X_t = self.transform(X, y) + return self.fit(X, y).transform(X, y) except MethodPropertyNotFoundError as e: raise e return _convert_to_woodwork_structure(X_t) diff --git a/evalml/tests/pipeline_tests/test_component_graph.py b/evalml/tests/pipeline_tests/test_component_graph.py index a4ce971e5b..0c458f4d63 100644 --- a/evalml/tests/pipeline_tests/test_component_graph.py +++ b/evalml/tests/pipeline_tests/test_component_graph.py @@ -345,8 +345,8 @@ def test_get_last_component(example_graph): @patch('evalml.pipelines.components.Estimator.predict') def test_fit(mock_predict, mock_fit, mock_fit_transform, example_graph, X_y_binary): X, y = X_y_binary - mock_fit_transform.return_value = pd.DataFrame(X) - mock_predict.return_value = 
pd.Series(y) + mock_fit_transform.return_value = ww.DataTable(X) + mock_predict.return_value = ww.DataColumn(y) component_graph = ComponentGraph(example_graph).instantiate({}) component_graph.fit(X, y) @@ -382,8 +382,7 @@ def test_fit_features(mock_predict, mock_fit, mock_fit_transform, X_y_binary): component_graph = ComponentGraph.from_list(component_list) component_graph.instantiate({}) - mock_X_t = pd.DataFrame(np.ones(X.shape)) - mock_fit_transform.return_value = ww.DataTable(mock_X_t) + mock_fit_transform.return_value = ww.DataTable(np.ones(X.shape)) mock_fit.return_value = Estimator mock_predict.return_value = ww.DataColumn(y) From 66c04f46eff941f953bd467cefb6d62d7a8049ec Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 17:40:02 -0500 Subject: [PATCH 81/98] fix delayed feature transformer not returning --- .../transformers/preprocessing/delayed_feature_transformer.py | 1 + 1 file changed, 1 insertion(+) diff --git a/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py b/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py index 4258066ce6..a5adcd7c5d 100644 --- a/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py +++ b/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py @@ -44,6 +44,7 @@ def __init__(self, max_delay=2, delay_features=True, delay_target=True, gap=1, def fit(self, X, y=None): """Fits the DelayFeatureTransformer.""" + return self @staticmethod def _encode_y_while_preserving_index(y): From 61d0ac0733efdf5ff37efa71159e14216d7ca9ed Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 18:07:03 -0500 Subject: [PATCH 82/98] clean up mock --- .../pipelines/components/transformers/transformer.py | 10 ++++------ evalml/tests/component_tests/test_components.py | 2 +- 2 files changed, 5 insertions(+), 7 deletions(-) diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index 3da96b0a32..b0f1344d18 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -40,11 +40,9 @@ def transform(self, X, y=None): if y is not None: y = _convert_to_woodwork_structure(y) y = _convert_woodwork_types_wrapper(y.to_series()) - # category treated differently from object... 
X_t = self._component_obj.transform(X, y)
         except AttributeError:
             raise MethodPropertyNotFoundError("Transformer requires a transform method or a component_obj that implements transform")
-
         X_t_df = pd.DataFrame(X_t, columns=X.columns, index=X.index)
         return _convert_to_woodwork_structure(X_t_df)
@@ -59,10 +57,10 @@ def fit_transform(self, X, y=None):
             ww.DataTable: Transformed X
         """
         try:
-            X = _convert_to_woodwork_structure(X)
-            y = _convert_to_woodwork_structure(y)
-            X_pd = _convert_woodwork_types_wrapper(X.to_dataframe())
-            y_pd = _convert_woodwork_types_wrapper(y.to_series())
+            X_ww = _convert_to_woodwork_structure(X)
+            y_ww = _convert_to_woodwork_structure(y)
+            X_pd = _convert_woodwork_types_wrapper(X_ww.to_dataframe())
+            y_pd = _convert_woodwork_types_wrapper(y_ww.to_series())
             X_t = self._component_obj.fit_transform(X_pd, y_pd)
         except AttributeError:
             try:
diff --git a/evalml/tests/component_tests/test_components.py b/evalml/tests/component_tests/test_components.py
index 0142cf1612..69f0da4b63 100644
--- a/evalml/tests/component_tests/test_components.py
+++ b/evalml/tests/component_tests/test_components.py
@@ -253,7 +253,7 @@ class MockTransformerWithFit(Transformer):
     name = "Mock Transformer"

     def fit(self, X, y=None):
-        return X
+        return self

 component = MockComponent()
 with pytest.raises(MethodPropertyNotFoundError, match="Component requires a fit method or a component_obj that implements fit"):

From 93940454fa2dde6051e5c3236fc84264c448463c Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Thu, 21 Jan 2021 18:42:08 -0500
Subject: [PATCH 83/98] combine prediction computation to one function

---
 evalml/pipelines/classification_pipeline.py |  8 ++++----
 .../time_series_classification_pipelines.py | 12 +-----------
 2 files changed, 5 insertions(+), 15 deletions(-)

diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py
index b17f4de0ef..3b3509f47e 100644
--- a/evalml/pipelines/classification_pipeline.py
+++ b/evalml/pipelines/classification_pipeline.py
@@ -130,12 +130,12 @@ def score(self, X, y, objectives):
             y_predicted_proba = _convert_woodwork_types_wrapper(y_predicted_proba.to_dataframe())
         return self._score_all_objectives(X, y, y_predicted, y_predicted_proba, objectives)

-    def _compute_predictions(self, X, objectives):
-        """Helper function to scan through the objectives list and precompute probabilities."""
+    def _compute_predictions(self, X, y, objectives, time_series=False):
+        """Compute predictions/probabilities based on objectives."""
         y_predicted = None
         y_predicted_proba = None
         if any(o.score_needs_proba for o in objectives):
-            y_predicted_proba = self.predict_proba(X)
+            y_predicted_proba = self.predict_proba(X, y) if time_series else self.predict_proba(X)
         if any(not o.score_needs_proba for o in objectives):
-            y_predicted = self._predict(X)
+            y_predicted = self._predict(X, y, pad=True) if time_series else self._predict(X)
         return y_predicted, y_predicted_proba
diff --git a/evalml/pipelines/time_series_classification_pipelines.py b/evalml/pipelines/time_series_classification_pipelines.py
index ec14409687..c0e5b7adfd 100644
--- a/evalml/pipelines/time_series_classification_pipelines.py
+++ b/evalml/pipelines/time_series_classification_pipelines.py
@@ -138,16 +138,6 @@ def predict_proba(self, X, y=None):
         padded = pad_with_nans(proba, max(0, features.shape[0] - proba.shape[0]))
         return _convert_to_woodwork_structure(padded)

-    def _compute_predictions(self, X, y, objectives):
-        """Compute predictions/probabilities based on objectives."""
y_predicted = None - y_predicted_proba = None - if any(o.score_needs_proba for o in objectives): - y_predicted_proba = self.predict_proba(X, y) - if any(not o.score_needs_proba for o in objectives): - y_predicted = self._predict(X, y, pad=True) - return y_predicted, y_predicted_proba - def score(self, X, y, objectives): """Evaluate model performance on current and additional objectives. @@ -166,7 +156,7 @@ def score(self, X, y, objectives): y_encoded = self._encode_targets(y) y_shifted = y_encoded.shift(-self.gap) - y_predicted, y_predicted_proba = self._compute_predictions(X, y, objectives) + y_predicted, y_predicted_proba = self._compute_predictions(X, y, objectives, time_series=True) if y_predicted is not None: y_predicted = _convert_woodwork_types_wrapper(y_predicted.to_series()) if y_predicted_proba is not None: From e7233f7be7daae04402d92bc4ece5922fef591c1 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Thu, 21 Jan 2021 19:03:10 -0500 Subject: [PATCH 84/98] oops, fix typo --- evalml/pipelines/classification_pipeline.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/evalml/pipelines/classification_pipeline.py b/evalml/pipelines/classification_pipeline.py index 3b3509f47e..b8a1d44141 100644 --- a/evalml/pipelines/classification_pipeline.py +++ b/evalml/pipelines/classification_pipeline.py @@ -123,7 +123,7 @@ def score(self, X, y, objectives): y = _convert_woodwork_types_wrapper(y.to_series()) objectives = [get_objective(o, return_instance=True) for o in objectives] y = self._encode_targets(y) - y_predicted, y_predicted_proba = self._compute_predictions(X, objectives) + y_predicted, y_predicted_proba = self._compute_predictions(X, y, objectives) if y_predicted is not None: y_predicted = _convert_woodwork_types_wrapper(y_predicted.to_series()) if y_predicted_proba is not None: From 6af7dfb4a4f714fac4877c91ce142b717a096d83 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 22 Jan 2021 00:24:53 -0500 Subject: [PATCH 85/98] some final touchups --- .../transformers/encoders/target_encoder.py | 1 - .../components/transformers/imputers/imputer.py | 3 --- .../preprocessing/delayed_feature_transformer.py | 10 +++++++++- .../components/transformers/preprocessing/lsa.py | 3 +-- .../components/transformers/transformer.py | 2 +- evalml/preprocessing/utils.py | 2 +- evalml/tests/automl_tests/test_automl.py | 15 --------------- .../test_column_selector_transformers.py | 2 +- evalml/tests/component_tests/test_components.py | 2 +- .../component_tests/test_per_column_imputer.py | 8 ++++---- .../regression_pipeline_tests/test_regression.py | 2 -- 11 files changed, 18 insertions(+), 32 deletions(-) diff --git a/evalml/pipelines/components/transformers/encoders/target_encoder.py b/evalml/pipelines/components/transformers/encoders/target_encoder.py index 1e28a1bcfe..386ef6f9b0 100644 --- a/evalml/pipelines/components/transformers/encoders/target_encoder.py +++ b/evalml/pipelines/components/transformers/encoders/target_encoder.py @@ -52,7 +52,6 @@ def __init__(self, random_state=random_state) def fit(self, X, y): - # TODO do we want to do this? 
if isinstance(X, pd.DataFrame): X.reset_index(drop=True, inplace=True) if isinstance(y, pd.Series): diff --git a/evalml/pipelines/components/transformers/imputers/imputer.py b/evalml/pipelines/components/transformers/imputers/imputer.py index ccd33a3d28..a80cf67bba 100644 --- a/evalml/pipelines/components/transformers/imputers/imputer.py +++ b/evalml/pipelines/components/transformers/imputers/imputer.py @@ -115,6 +115,3 @@ def transform(self, X, y=None): X_null_dropped = _convert_to_woodwork_structure(X_null_dropped) return X_null_dropped - - # def fit_transform(self, X, y=None): - # return self.fit(X, y).transform(X, y) diff --git a/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py b/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py index a5adcd7c5d..2de90de63b 100644 --- a/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py +++ b/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py @@ -43,7 +43,15 @@ def __init__(self, max_delay=2, delay_features=True, delay_target=True, gap=1, super().__init__(parameters=parameters, random_state=random_state) def fit(self, X, y=None): - """Fits the DelayFeatureTransformer.""" + """Fits the DelayFeatureTransformer. + + Arguments: + X (ww.DataTable, pd.DataFrame or np.ndarray): the input training data of shape [n_samples, n_features] + y (ww.DataColumn, pd.Series, optional): the target training data of length [n_samples] + + Returns: + self + """ return self @staticmethod diff --git a/evalml/pipelines/components/transformers/preprocessing/lsa.py b/evalml/pipelines/components/transformers/preprocessing/lsa.py index 9ae5d46c61..bff9d1fc16 100644 --- a/evalml/pipelines/components/transformers/preprocessing/lsa.py +++ b/evalml/pipelines/components/transformers/preprocessing/lsa.py @@ -64,5 +64,4 @@ def transform(self, X, y=None): X_t['LSA({})[0]'.format(col)] = pd.Series(transformed[:, 0], index=X.index) X_t['LSA({})[1]'.format(col)] = pd.Series(transformed[:, 1], index=X.index) X_t = X_t.drop(columns=text_columns) - X_t = _convert_to_woodwork_structure(X_t) - return X_t + return _convert_to_woodwork_structure(X_t) diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index b0f1344d18..ead4c3a5ed 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -64,7 +64,7 @@ def fit_transform(self, X, y=None): X_t = self._component_obj.fit_transform(X_pd, y_pd) except AttributeError: try: - return self.fit(X, y).transform(X, y) + X_t = self.fit(X, y).transform(X, y) except MethodPropertyNotFoundError as e: raise e return _convert_to_woodwork_structure(X_t) diff --git a/evalml/preprocessing/utils.py b/evalml/preprocessing/utils.py index dc2095a1ad..93d71c966a 100644 --- a/evalml/preprocessing/utils.py +++ b/evalml/preprocessing/utils.py @@ -54,7 +54,7 @@ def split_data(X, y, problem_type, problem_configuration=None, test_size=.2, ran X (ww.Datatable, pd.Dataframe or np.ndarray): data of shape [n_samples, n_features] y (ww.Datacolumn, pd.Series, or np.ndarray): target data of length [n_samples] problem_type (str or ProblemTypes): type of supervised learning problem. see evalml.problem_types.problemtype.all_problem_types for a full list. - problem_configuration (dict, None): Additional parameters needed to configure the search. 
For example, + problem_configuration (dict): Additional parameters needed to configure the search. For example, in time series problems, values should be passed in for the gap and max_delay variables. test_size (float): What percentage of data points should be included in the test set. Defaults to 0.2 (20%). random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. diff --git a/evalml/tests/automl_tests/test_automl.py b/evalml/tests/automl_tests/test_automl.py index 385f413ea2..af6e16f8e1 100644 --- a/evalml/tests/automl_tests/test_automl.py +++ b/evalml/tests/automl_tests/test_automl.py @@ -416,21 +416,6 @@ def test_automl_bad_data_check_parameter_type(): automl.search(data_checks=[MockDataCheckErrorAndWarning]) -# I don't think this tests what the name implies.... -# @patch('evalml.pipelines.RegressionPipeline.fit') -# @patch('evalml.pipelines.RegressionPipeline.predict') -# @patch('evalml.data_checks.InvalidTargetDataCheck') -# def test_automl_passes_correct_objective_name_to_invalid_target_data_checks(mock_obj, mock_predict, mock_fit, X_y_regression): -# X, y = X_y_regression -# mock_obj.objective_name.return_value = "R2" -# mock_predict.return_value = ww.DataColumn(pd.Series([0] * len(y))) -# automl = AutoMLSearch(X, y, max_iterations=1, problem_type=ProblemTypes.REGRESSION) -# automl.search() -# mock_fit.assert_called() -# mock_predict.assert_called() -# assert automl.objective.name == mock_obj.objective_name.return_value - - class MockDataCheckObjective(DataCheck): def __init__(self, objective): self.objective_name = get_objective(objective).name diff --git a/evalml/tests/component_tests/test_column_selector_transformers.py b/evalml/tests/component_tests/test_column_selector_transformers.py index 2cec634b43..5fb8a9f2e3 100644 --- a/evalml/tests/component_tests/test_column_selector_transformers.py +++ b/evalml/tests/component_tests/test_column_selector_transformers.py @@ -113,7 +113,7 @@ def test_drop_column_transformer_input_invalid_col_name(class_to_test): pd.DataFrame(np.arange(12).reshape(3, 4), dtype="Int64"), pd.DataFrame([[], [], []], dtype="Int64")]) ]) -def test_column_transformer_int_col_names(class_to_test, answers): +def test_column_transformer_int_col_names_np_array(class_to_test, answers): X = np.arange(12).reshape(3, 4) answer1, answer2, answer3 = answers diff --git a/evalml/tests/component_tests/test_components.py b/evalml/tests/component_tests/test_components.py index 69f0da4b63..b2d02e1155 100644 --- a/evalml/tests/component_tests/test_components.py +++ b/evalml/tests/component_tests/test_components.py @@ -632,7 +632,7 @@ def fit(self, X, y): pass def transform(self, X, y=None): - return pd.DataFrame() + return ww.DataTable(X) class MockTransformer(Transformer): name = "Mock Transformer" diff --git a/evalml/tests/component_tests/test_per_column_imputer.py b/evalml/tests/component_tests/test_per_column_imputer.py index d2d508ac85..f4e8737562 100644 --- a/evalml/tests/component_tests/test_per_column_imputer.py +++ b/evalml/tests/component_tests/test_per_column_imputer.py @@ -32,9 +32,9 @@ def test_all_strategies(): "C": pd.Series([6, 8, 8, np.nan]), "D": pd.Series(["a", "a", "b", np.nan])}) - X_expected = pd.DataFrame({"A": pd.Series([2, 4, 6, 4], dtype="int64"), - "B": pd.Series([4, 6, 4, 4], dtype="int64"), - "C": pd.Series([6, 8, 8, 100], dtype="int64"), + X_expected = pd.DataFrame({"A": pd.Series([2, 4, 6, 4]), + "B": pd.Series([4, 6, 4, 4]), + "C": pd.Series([6, 8, 8, 100]), "D": pd.Series(["a", "a", "b", "a"], 
dtype="category")})

     strategies = {
@@ -126,7 +126,7 @@ def test_non_numeric_valid(non_numeric_df):
                                "C": pd.Series(["a", "b", "a", "a"], dtype="category"),
                                "D": pd.Series(["a", "b", "a", 100], dtype="category")})
     X_t = transformer.fit_transform(X)
-    assert_frame_equal(X_expected, X_t.to_dataframe(), check_dtype=False)
+    assert_frame_equal(X_expected, X_t.to_dataframe())

 def test_fit_transform_drop_all_nan_columns():
diff --git a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py
index a73bacebb3..a1cd87cacd 100644
--- a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py
+++ b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_regression.py
@@ -27,8 +27,6 @@ def test_woodwork_regression_pipeline(linear_regression_pipeline_class):

 def test_custom_indices():
-    # custom regression pipeline
-    # don't need to use target encoder, which wont run on core dependencies true tests
     class MyPipeline(RegressionPipeline):
         component_graph = ['Imputer', 'One Hot Encoder', 'Linear Regressor']
         custom_name = "My Pipeline"

From c163d9887a1398f95bdddcb0177184eea2e2f310 Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Fri, 22 Jan 2021 01:39:40 -0500
Subject: [PATCH 86/98] docstring update

---
 evalml/preprocessing/utils.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/evalml/preprocessing/utils.py b/evalml/preprocessing/utils.py
index 93d71c966a..a0bd7f618f 100644
--- a/evalml/preprocessing/utils.py
+++ b/evalml/preprocessing/utils.py
@@ -51,8 +51,8 @@ def split_data(X, y, problem_type, problem_configuration=None, test_size=.2, ran
     """Splits data into train and test sets.

     Arguments:
-        X (ww.Datatable, pd.Dataframe or np.ndarray): data of shape [n_samples, n_features]
-        y (ww.Datacolumn, pd.Series, or np.ndarray): target data of length [n_samples]
+        X (ww.DataTable, pd.DataFrame or np.ndarray): data of shape [n_samples, n_features]
+        y (ww.DataColumn, pd.Series, or np.ndarray): target data of length [n_samples]
         problem_type (str or ProblemTypes): type of supervised learning problem. see evalml.problem_types.problemtype.all_problem_types for a full list.
         problem_configuration (dict): Additional parameters needed to configure the search. For example,
             in time series problems, values should be passed in for the gap and max_delay variables.
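For reference, the split_data contract documented in the patch above can be exercised as in the sketch below. This snippet is illustrative only and is not part of any patch in this series: the column names and values are invented, the call assumes the signature shown in the hunk header above, and the woodwork return values reflect the conversions this series introduces.

    import pandas as pd
    from evalml.preprocessing import split_data

    X = pd.DataFrame({"feature_a": [1, 2, 3, 4, 5, 6, 7, 8],
                      "feature_b": [0.5, 0.1, 0.9, 0.2, 0.4, 0.7, 0.3, 0.8]})
    y = pd.Series([0, 1, 0, 1, 0, 1, 0, 1])

    # pandas (or numpy, or woodwork) containers are accepted as input.
    X_train, X_test, y_train, y_test = split_data(X, y, problem_type="binary", test_size=0.25)

    # The splits come back as ww.DataTable / ww.DataColumn; convert back to
    # pandas with the same helpers used throughout this series when needed.
    X_train_df = X_train.to_dataframe()
    y_train_series = y_train.to_series()

Keeping the splits as woodwork structures lets downstream components reuse the inferred types instead of re-running type inference on every fit or transform call.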
From 9ecbacedebe70ad8b41823e4a4e5d00d09e9efc1 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Fri, 22 Jan 2021 03:29:10 -0500 Subject: [PATCH 87/98] updating component graph impl and adding test --- evalml/pipelines/component_graph.py | 11 +++++----- .../pipeline_tests/test_component_graph.py | 22 +++++++++++++++++++ 2 files changed, 27 insertions(+), 6 deletions(-) diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py index e5858069d3..c09fba8bc9 100644 --- a/evalml/pipelines/component_graph.py +++ b/evalml/pipelines/component_graph.py @@ -176,7 +176,6 @@ def _compute_features(self, component_list, X, y=None, fit=False): if len(component_list) == 0: return X output_cache = {} - input_logical_types = X.logical_types for component_name in component_list: component_instance = self.get_component(component_name) if not isinstance(component_instance, ComponentBase): @@ -196,11 +195,11 @@ def _compute_features(self, component_list, X, y=None, fit=False): parent_x = pd.Series(_convert_woodwork_types_wrapper(parent_x.to_series()), name=parent_input) x_inputs.append(parent_x) input_x, input_y = self._consolidate_inputs(x_inputs, y_input, X, y) - for col in input_logical_types: - if (col in input_x.columns and - input_logical_types[col] != input_x[col].logical_type and - "numeric" not in input_x[col].semantic_tags): # numeric is special because we may not be able to safely convert (ex: input is int, output is float) - input_x = input_x.set_types({col: input_logical_types[col]}) + col_intersection = set(X.columns.keys()).intersection(set(input_x.columns.keys())) + for col in col_intersection: + if (X[col].logical_type != input_x[col].logical_type and + "numeric" not in X[col].semantic_tags): # numeric is special because we may not be able to safely convert (ex: input is int, output is float) + input_x = input_x.set_types({col: X[col].logical_type}) self.input_feature_names.update({component_name: list(input_x.columns)}) if isinstance(component_instance, Transformer): diff --git a/evalml/tests/pipeline_tests/test_component_graph.py b/evalml/tests/pipeline_tests/test_component_graph.py index 0c458f4d63..dca0134268 100644 --- a/evalml/tests/pipeline_tests/test_component_graph.py +++ b/evalml/tests/pipeline_tests/test_component_graph.py @@ -21,6 +21,7 @@ RandomForestClassifier, Transformer ) +from evalml.utils.gen_utils import infer_feature_types class DummyTransformer(Transformer): @@ -675,3 +676,24 @@ def test_iteration(example_graph): expected = [Imputer(), OneHotEncoder(), ElasticNetClassifier(), OneHotEncoder(top_n=32), RandomForestClassifier(), LogisticRegressionClassifier()] iteration = [component for component in component_graph] assert iteration == expected + + +def test_custom_input_feature_types(example_graph): + X = pd.DataFrame({'column_1': ['a', 'b', 'c', 'd', 'a', 'a', 'b', 'c', 'b'], + 'column_2': [1, 2, 3, 4, 5, 6, 5, 4, 3]}) + y = pd.Series([1, 0, 1, 0, 1, 1, 0, 0, 0]) + X = infer_feature_types(X, {"column_2": "categorical"}) + + component_graph = ComponentGraph(example_graph) + component_graph.instantiate({'OneHot_RandomForest': {'top_n': 2}, + 'OneHot_ElasticNet': {'top_n': 3}}) + assert component_graph.input_feature_names == {} + component_graph.fit(X, y) + + input_feature_names = component_graph.input_feature_names + assert input_feature_names['Imputer'] == ['column_1', 'column_2'] + assert input_feature_names['OneHot_RandomForest'] == ['column_1', 'column_2'] + assert input_feature_names['OneHot_ElasticNet'] == ['column_1', 'column_2'] + assert 
input_feature_names['Random Forest'] == ['column_1_a', 'column_1_b', 'column_2_3', 'column_2_4']
+    assert input_feature_names['Elastic Net'] == ['column_1_a', 'column_1_b', 'column_1_c', 'column_2_3', 'column_2_4', 'column_2_5']
+    assert input_feature_names['Logistic Regression'] == ['Random Forest', 'Elastic Net']

From 6c1ef8982a1d3557b3049d79456ae4bc598b163d Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Mon, 25 Jan 2021 18:26:52 -0500
Subject: [PATCH 88/98] fix docs

---
 evalml/pipelines/component_graph.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py
index 2d91d57238..6e98088692 100644
--- a/evalml/pipelines/component_graph.py
+++ b/evalml/pipelines/component_graph.py
@@ -199,7 +199,7 @@ def _compute_features(self, component_list, X, y=None, fit=False):
             col_intersection = set(X.columns.keys()).intersection(set(input_x.columns.keys()))
             for col in col_intersection:
                 if (X[col].logical_type != input_x[col].logical_type and
-                        "numeric" not in X[col].semantic_tags):  # numeric is special because we may not be able to safely convert (ex: input is int, output is float)
+                        "numeric" not in X[col].semantic_tags and "numeric" not in input_x[col].semantic_tags):  # numeric is special because we may not be able to safely convert (ex: input is int, output is float)
                     input_x = input_x.set_types({col: X[col].logical_type})

From 94ad165c387935097d96d5b51be7ef2611dc595a Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Tue, 26 Jan 2021 00:25:47 -0500
Subject: [PATCH 89/98] fix

---
 evalml/pipelines/component_graph.py           | 10 ++++--
 .../pipeline_tests/test_component_graph.py    | 35 +++++++++++++++++++
 2 files changed, 43 insertions(+), 2 deletions(-)

diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py
index 6e98088692..139429d203 100644
--- a/evalml/pipelines/component_graph.py
+++ b/evalml/pipelines/component_graph.py
@@ -199,8 +199,14 @@ def _compute_features(self, component_list, X, y=None, fit=False):
         col_intersection = set(X.columns.keys()).intersection(set(input_x.columns.keys()))
         for col in col_intersection:
             if (X[col].logical_type != input_x[col].logical_type and
-                        "numeric" not in X[col].semantic_tags and "numeric" not in input_x[col].semantic_tags):  # numeric is special because we may not be able to safely convert (ex: input is int, output is float)
-                    input_x = input_x.set_types({col: X[col].logical_type})
+                        "numeric" not in X[col].semantic_tags):  # numeric is special because we may not be able to safely convert (ex: input is int, output is float)
+                    try:
+                        input_x = input_x.set_types({col: X[col].logical_type})
+                    except TypeError:
+                        # if there is a column whose type has been converted s.t. it cannot be converted back, keep as is.
+                        # example: StandardScaler could convert a boolean column to a float column. This is expected, and we should not
+                        # try to convert back to boolean.
+ continue self.input_feature_names.update({component_name: list(input_x.columns)}) if isinstance(component_instance, Transformer): diff --git a/evalml/tests/pipeline_tests/test_component_graph.py b/evalml/tests/pipeline_tests/test_component_graph.py index dca0134268..ca27e2016c 100644 --- a/evalml/tests/pipeline_tests/test_component_graph.py +++ b/evalml/tests/pipeline_tests/test_component_graph.py @@ -697,3 +697,38 @@ def test_custom_input_feature_types(example_graph): assert input_feature_names['Random Forest'] == ['column_1_a', 'column_1_b', 'column_2_3', 'column_2_4'] assert input_feature_names['Elastic Net'] == ['column_1_a', 'column_1_b', 'column_1_c', 'column_2_3', 'column_2_4', 'column_2_5'] assert input_feature_names['Logistic Regression'] == ['Random Forest', 'Elastic Net'] + +from evalml.pipelines.components import DateTimeFeaturizer, StandardScaler +def test_component_graph_dataset_with_different_types(): + graph = {'Imputer': [Imputer], + 'OneHot': [OneHotEncoder, 'Imputer.x'], + 'DateTime': [DateTimeFeaturizer, 'OneHot.x'], + 'Scaler': [StandardScaler, 'DateTime.x'], + 'Random Forest': [RandomForestClassifier, 'Scaler.x'], + 'Elastic Net': [ElasticNetClassifier, 'Scaler.x'], + 'Logistic Regression': [LogisticRegressionClassifier, 'Random Forest', 'Elastic Net']} + + X = pd.DataFrame({'column_1': ['a', 'b', 'c', 'd', 'a', 'a', 'b', 'c', 'b'], + 'column_2': [1, 2, 3, 4, 5, 6, 5, 4, 3], + 'column_3': [True, False, True, False, True, False, True, False, False]}) + y = pd.Series([1, 0, 1, 0, 1, 1, 0, 0, 0]) + X = infer_feature_types(X, {"column_2": "categorical"}) + + component_graph = ComponentGraph(graph) + component_graph.instantiate({'OneHot_RandomForest': {'top_n': 2}, + 'OneHot_ElasticNet': {'top_n': 3}}) + assert component_graph.input_feature_names == {} + component_graph.fit(X, y) + + input_feature_names = component_graph.input_feature_names + assert input_feature_names['Imputer'] == ['column_1', 'column_2', 'column_3'] + assert input_feature_names['OneHot'] == ['column_1', 'column_2', 'column_3'] + assert input_feature_names['DateTime'] == ['column_3', 'column_1_a', 'column_1_b', 'column_1_c', 'column_1_d', + 'column_2_1', 'column_2_2', 'column_2_3', 'column_2_4', 'column_2_5', 'column_2_6'] + assert input_feature_names['Scaler'] == ['column_3', 'column_1_a', 'column_1_b', 'column_1_c', 'column_1_d', + 'column_2_1', 'column_2_2', 'column_2_3', 'column_2_4', 'column_2_5', 'column_2_6'] + assert input_feature_names['Random Forest'] == ['column_3', 'column_1_a', 'column_1_b', 'column_1_c', 'column_1_d', + 'column_2_1', 'column_2_2', 'column_2_3', 'column_2_4', 'column_2_5', 'column_2_6'] + assert input_feature_names['Elastic Net'] == ['column_3', 'column_1_a', 'column_1_b', 'column_1_c', 'column_1_d', + 'column_2_1', 'column_2_2', 'column_2_3', 'column_2_4', 'column_2_5', 'column_2_6'] + assert input_feature_names['Logistic Regression'] == ['Random Forest', 'Elastic Net'] From e144a0a055d9d1f509bed368bd26a274e534a00a Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Tue, 26 Jan 2021 01:12:54 -0500 Subject: [PATCH 90/98] lint and document --- .../pipeline_tests/test_component_graph.py | 18 +++++++++++------- 1 file changed, 11 insertions(+), 7 deletions(-) diff --git a/evalml/tests/pipeline_tests/test_component_graph.py b/evalml/tests/pipeline_tests/test_component_graph.py index ca27e2016c..2de8307a56 100644 --- a/evalml/tests/pipeline_tests/test_component_graph.py +++ b/evalml/tests/pipeline_tests/test_component_graph.py @@ -13,12 +13,14 @@ from evalml.exceptions import 
MissingComponentError from evalml.pipelines import ComponentGraph from evalml.pipelines.components import ( + DateTimeFeaturizer, ElasticNetClassifier, Estimator, Imputer, LogisticRegressionClassifier, OneHotEncoder, RandomForestClassifier, + StandardScaler, Transformer ) from evalml.utils.gen_utils import infer_feature_types @@ -698,8 +700,11 @@ def test_custom_input_feature_types(example_graph): assert input_feature_names['Elastic Net'] == ['column_1_a', 'column_1_b', 'column_1_c', 'column_2_3', 'column_2_4', 'column_2_5'] assert input_feature_names['Logistic Regression'] == ['Random Forest', 'Elastic Net'] -from evalml.pipelines.components import DateTimeFeaturizer, StandardScaler + def test_component_graph_dataset_with_different_types(): + # Checks that types are converted correctly by Woodwork. Specifically, the standard scaler + # should convert column_3 to float, so our code to try to convert back to the original boolean type + # will catch the TypeError thrown and not convert the column. graph = {'Imputer': [Imputer], 'OneHot': [OneHotEncoder, 'Imputer.x'], 'DateTime': [DateTimeFeaturizer, 'OneHot.x'], @@ -715,8 +720,7 @@ def test_component_graph_dataset_with_different_types(): X = infer_feature_types(X, {"column_2": "categorical"}) component_graph = ComponentGraph(graph) - component_graph.instantiate({'OneHot_RandomForest': {'top_n': 2}, - 'OneHot_ElasticNet': {'top_n': 3}}) + component_graph.instantiate({}) assert component_graph.input_feature_names == {} component_graph.fit(X, y) @@ -724,11 +728,11 @@ def test_component_graph_dataset_with_different_types(): assert input_feature_names['Imputer'] == ['column_1', 'column_2', 'column_3'] assert input_feature_names['OneHot'] == ['column_1', 'column_2', 'column_3'] assert input_feature_names['DateTime'] == ['column_3', 'column_1_a', 'column_1_b', 'column_1_c', 'column_1_d', - 'column_2_1', 'column_2_2', 'column_2_3', 'column_2_4', 'column_2_5', 'column_2_6'] + 'column_2_1', 'column_2_2', 'column_2_3', 'column_2_4', 'column_2_5', 'column_2_6'] assert input_feature_names['Scaler'] == ['column_3', 'column_1_a', 'column_1_b', 'column_1_c', 'column_1_d', - 'column_2_1', 'column_2_2', 'column_2_3', 'column_2_4', 'column_2_5', 'column_2_6'] + 'column_2_1', 'column_2_2', 'column_2_3', 'column_2_4', 'column_2_5', 'column_2_6'] assert input_feature_names['Random Forest'] == ['column_3', 'column_1_a', 'column_1_b', 'column_1_c', 'column_1_d', - 'column_2_1', 'column_2_2', 'column_2_3', 'column_2_4', 'column_2_5', 'column_2_6'] + 'column_2_1', 'column_2_2', 'column_2_3', 'column_2_4', 'column_2_5', 'column_2_6'] assert input_feature_names['Elastic Net'] == ['column_3', 'column_1_a', 'column_1_b', 'column_1_c', 'column_1_d', - 'column_2_1', 'column_2_2', 'column_2_3', 'column_2_4', 'column_2_5', 'column_2_6'] + 'column_2_1', 'column_2_2', 'column_2_3', 'column_2_4', 'column_2_5', 'column_2_6'] assert input_feature_names['Logistic Regression'] == ['Random Forest', 'Elastic Net'] From 6e41ee74968e3bef5eaf29e99078c81aa5f5ec26 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Tue, 26 Jan 2021 11:05:14 -0500 Subject: [PATCH 91/98] fix some tests --- .../test_datetime_featurizer.py | 2 +- .../test_delayed_features_transformer.py | 26 ------------------- .../component_tests/test_lgbm_classifier.py | 20 +++++++------- 3 files changed, 11 insertions(+), 37 deletions(-) diff --git a/evalml/tests/component_tests/test_datetime_featurizer.py b/evalml/tests/component_tests/test_datetime_featurizer.py index 50e93e22b5..67c6550635 100644 --- 
a/evalml/tests/component_tests/test_datetime_featurizer.py +++ b/evalml/tests/component_tests/test_datetime_featurizer.py @@ -105,7 +105,7 @@ def test_datetime_featurizer_no_features_to_extract(): datetime_transformer = DateTimeFeaturizer(features_to_extract=[]) rng = pd.date_range('2020-02-24', periods=20, freq='D') X = pd.DataFrame({"date col": rng, "numerical": [0] * len(rng)}) - expected = X + expected = pd.DataFrame({"date col": rng, "numerical": [0] * len(rng)}) expected["numerical"] = expected["numerical"].astype("Int64") datetime_transformer.fit(X) transformed = datetime_transformer.transform(X).to_dataframe() diff --git a/evalml/tests/component_tests/test_delayed_features_transformer.py b/evalml/tests/component_tests/test_delayed_features_transformer.py index 3000137cb7..4cb27c30ea 100644 --- a/evalml/tests/component_tests/test_delayed_features_transformer.py +++ b/evalml/tests/component_tests/test_delayed_features_transformer.py @@ -13,7 +13,6 @@ def delayed_features_data(): def test_delayed_features_transformer_init(): - delayed_features = DelayedFeatureTransformer(max_delay=4, delay_features=True, delay_target=False, random_state=1) assert delayed_features.parameters == {"max_delay": 4, "delay_features": True, "delay_target": False, @@ -41,7 +40,6 @@ def encode_X_y_as_strings(X, y, encode_X_as_str, encode_y_as_str): X_answer = X if encode_X_as_str: X, X_answer = encode_X_as_string(X) - return X, X_answer, y, y_answer @@ -49,9 +47,7 @@ def encode_X_y_as_strings(X, y, encode_X_as_str, encode_y_as_str): @pytest.mark.parametrize('encode_y_as_str', [True, False]) def test_delayed_feature_extractor_maxdelay3_gap1(encode_X_as_str, encode_y_as_str, delayed_features_data): X, y = delayed_features_data - X, X_answer, y, y_answer = encode_X_y_as_strings(X, y, encode_X_as_str, encode_y_as_str) - answer = pd.DataFrame({"feature": X.feature, "feature_delay_1": X_answer.feature.shift(1), "feature_delay_2": X_answer.feature.shift(2), @@ -76,12 +72,8 @@ def test_delayed_feature_extractor_maxdelay3_gap1(encode_X_as_str, encode_y_as_s @pytest.mark.parametrize('encode_X_as_str', [True, False]) @pytest.mark.parametrize('encode_y_as_str', [True, False]) def test_delayed_feature_extractor_maxdelay5_gap1(encode_X_as_str, encode_y_as_str, delayed_features_data): - X, y = delayed_features_data X, X_answer, y, y_answer = encode_X_y_as_strings(X, y, encode_X_as_str, encode_y_as_str) - - X, X_answer, y, y_answer = encode_X_y_as_strings(X, y, encode_X_as_str, encode_y_as_str) - answer = pd.DataFrame({"feature": X.feature, "feature_delay_1": X_answer.feature.shift(1), "feature_delay_2": X_answer.feature.shift(2), @@ -110,11 +102,8 @@ def test_delayed_feature_extractor_maxdelay5_gap1(encode_X_as_str, encode_y_as_s @pytest.mark.parametrize('encode_X_as_str', [True, False]) @pytest.mark.parametrize('encode_y_as_str', [True, False]) def test_delayed_feature_extractor_maxdelay3_gap7(encode_X_as_str, encode_y_as_str, delayed_features_data): - X, y = delayed_features_data - X, X_answer, y, y_answer = encode_X_y_as_strings(X, y, encode_X_as_str, encode_y_as_str) - answer = pd.DataFrame({"feature": X.feature, "feature_delay_1": X_answer.feature.shift(1), "feature_delay_2": X_answer.feature.shift(2), @@ -137,14 +126,10 @@ def test_delayed_feature_extractor_maxdelay3_gap7(encode_X_as_str, encode_y_as_s @pytest.mark.parametrize('encode_X_as_str', [True, False]) @pytest.mark.parametrize('encode_y_as_str', [True, False]) def test_delayed_feature_extractor_numpy(encode_X_as_str, encode_y_as_str, delayed_features_data): - 
X, y = delayed_features_data - X, X_answer, y, y_answer = encode_X_y_as_strings(X, y, encode_X_as_str, encode_y_as_str) - X_np = X.values y_np = y.values - answer = pd.DataFrame({0: X.feature, "0_delay_1": X_answer.feature.shift(1), "0_delay_2": X_answer.feature.shift(2), @@ -171,9 +156,7 @@ def test_lagged_feature_extractor_delay_features_delay_target(encode_y_as_str, e delay_target, delayed_features_data): X, y = delayed_features_data - X, X_answer, y, y_answer = encode_X_y_as_strings(X, y, encode_X_as_str, encode_y_as_str) - all_delays = pd.DataFrame({"feature": X.feature, "feature_delay_1": X_answer.feature.shift(1), "feature_delay_2": X_answer.feature.shift(2), @@ -200,9 +183,7 @@ def test_lagged_feature_extractor_delay_features_delay_target(encode_y_as_str, e def test_lagged_feature_extractor_delay_target(encode_y_as_str, encode_X_as_str, delay_features, delay_target, delayed_features_data): X, y = delayed_features_data - X, X_answer, y, y_answer = encode_X_y_as_strings(X, y, encode_X_as_str, encode_y_as_str) - answer = pd.DataFrame() if delay_target: answer = pd.DataFrame({"target_delay_0": y_answer.astype("Int64"), @@ -218,7 +199,6 @@ def test_lagged_feature_extractor_delay_target(encode_y_as_str, encode_X_as_str, @pytest.mark.parametrize("gap", [0, 1, 7]) def test_target_delay_when_gap_is_0(gap, delayed_features_data): X, y = delayed_features_data - expected = pd.DataFrame({"feature": X.feature.astype("Int64"), "feature_delay_1": X.feature.shift(1), "target_delay_0": y.astype("Int64"), @@ -229,13 +209,11 @@ def test_target_delay_when_gap_is_0(gap, delayed_features_data): transformer = DelayedFeatureTransformer(max_delay=1, gap=gap) assert_frame_equal(expected, transformer.fit_transform(X, y).to_dataframe()) - expected = pd.DataFrame({"target_delay_0": y.astype("Int64"), "target_delay_1": y.shift(1)}) if gap == 0: expected = expected.drop(columns=["target_delay_0"]) - assert_frame_equal(expected, transformer.fit_transform(None, y).to_dataframe()) @@ -245,14 +223,11 @@ def test_target_delay_when_gap_is_0(gap, delayed_features_data): def test_delay_feature_transformer_supports_custom_index(encode_X_as_str, encode_y_as_str, data_type, make_data_type, delayed_features_data): X, y = delayed_features_data - X, X_answer, y, y_answer = encode_X_y_as_strings(X, y, encode_X_as_str, encode_y_as_str) - X.index = pd.RangeIndex(50, 81) X_answer.index = pd.RangeIndex(50, 81) y.index = pd.RangeIndex(50, 81) y_answer.index = pd.RangeIndex(50, 81) - answer = pd.DataFrame({"feature": X.feature, "feature_delay_1": X_answer.feature.shift(1), "feature_delay_2": X_answer.feature.shift(2), @@ -277,7 +252,6 @@ def test_delay_feature_transformer_supports_custom_index(encode_X_as_str, encode def test_delay_feature_transformer_multiple_categorical_columns(delayed_features_data): - X, y = delayed_features_data X, X_answer, y, y_answer = encode_X_y_as_strings(X, y, True, True) X['feature_2'] = pd.Categorical(["a"] * 10 + ['aa'] * 10 + ['aaa'] * 10 + ['aaaa']) diff --git a/evalml/tests/component_tests/test_lgbm_classifier.py b/evalml/tests/component_tests/test_lgbm_classifier.py index bd2d4cb779..90b535f317 100644 --- a/evalml/tests/component_tests/test_lgbm_classifier.py +++ b/evalml/tests/component_tests/test_lgbm_classifier.py @@ -132,8 +132,8 @@ def test_fit_string_features(X_y_binary): np.testing.assert_almost_equal(y_pred_proba_sk, y_pred_proba.to_dataframe().values, decimal=5) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba', return_value=ww.DataTable(pd.DataFrame())) 
-@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict', return_value=ww.DataColumn(pd.Series())) +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba') +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') @patch('evalml.pipelines.components.component_base.ComponentBase.fit') def test_fit_no_categories(mock_fit, mock_predict, mock_predict_proba, X_y_binary): X, y = X_y_binary @@ -153,8 +153,8 @@ def test_fit_no_categories(mock_fit, mock_predict, mock_predict_proba, X_y_binar np.testing.assert_array_equal(arg_X, X2) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba', return_value=ww.DataTable(pd.DataFrame())) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict', return_value=ww.DataColumn(pd.Series())) +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba') +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') @patch('evalml.pipelines.components.component_base.ComponentBase.fit') def test_correct_args(mock_fit, mock_predict, mock_predict_proba, X_y_binary): X, y = X_y_binary @@ -190,8 +190,8 @@ def test_correct_args(mock_fit, mock_predict, mock_predict_proba, X_y_binary): assert_frame_equal(X_expected, arg_X) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba', return_value=ww.DataTable(pd.DataFrame())) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict', return_value=ww.DataColumn(pd.Series())) +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba') +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') @patch('evalml.pipelines.components.component_base.ComponentBase.fit') def test_categorical_data_subset(mock_fit, mock_predict, mock_predict_proba, X_y_binary): X = pd.DataFrame({"feature_1": [0, 0, 1, 1, 0, 1], "feature_2": ["a", "a", "b", "b", "c", "c"]}) @@ -218,8 +218,8 @@ def test_categorical_data_subset(mock_fit, mock_predict, mock_predict_proba, X_y assert_frame_equal(X_expected_subset, arg_X) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba', return_value=ww.DataTable(pd.DataFrame())) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict', return_value=ww.DataColumn(pd.Series())) +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict_proba') +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') @patch('evalml.pipelines.components.component_base.ComponentBase.fit') def test_multiple_fit(mock_fit, mock_predict, mock_predict_proba): y = pd.Series([1] * 4) @@ -251,7 +251,7 @@ def test_multiple_fit(mock_fit, mock_predict, mock_predict_proba): assert_frame_equal(X2_predict_expected, mock_predict_proba.call_args[0][0]) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict', return_value=ww.DataColumn(pd.Series())) +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') @patch('evalml.pipelines.components.component_base.ComponentBase.fit') def test_multiclass_label(mock_fit, mock_predict, X_y_multi): X, y = X_y_multi @@ -266,7 +266,7 @@ def test_multiclass_label(mock_fit, mock_predict, X_y_multi): clf.predict(X) -@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict', return_value=ww.DataColumn(pd.Series())) +@patch('evalml.pipelines.components.estimators.estimator.Estimator.predict') 
@patch('evalml.pipelines.components.component_base.ComponentBase.fit') def test_binary_label_encoding(mock_fit, mock_predict, X_y_binary): X, y = X_y_binary From ade7fb55125a3685c1f49aed0b8332f15b512668 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Tue, 26 Jan 2021 13:39:48 -0500 Subject: [PATCH 92/98] fix docstr --- evalml/automl/utils.py | 7 ------- 1 file changed, 7 deletions(-) diff --git a/evalml/automl/utils.py b/evalml/automl/utils.py index a8a64ebe15..088526cf98 100644 --- a/evalml/automl/utils.py +++ b/evalml/automl/utils.py @@ -43,17 +43,10 @@ def make_data_splitter(X, y, problem_type, problem_configuration=None, n_splits= y (ww.DataColumn, pd.Series): The target training data of length [n_samples]. problem_type (ProblemType): The type of machine learning problem. problem_configuration (dict, None): Additional parameters needed to configure the search. For example, -<<<<<<< HEAD in time series problems, values should be passed in for the gap and max_delay variables. Defaults to None. n_splits (int, None): The number of CV splits, if applicable. Defaults to 3. shuffle (bool): Whether or not to shuffle the data before splitting, if applicable. Defaults to True. - random_state (int, np.random.RandomState): Seed for the random number generator. Defaults to 0. -======= - in time series problems, values should be passed in for the gap and max_delay variables. - n_splits (int, None): the number of CV splits, if applicable. Default 3. - shuffle (bool): whether or not to shuffle the data before splitting, if applicable. Default True. random_state (int): Seed for the random number generator. Defaults to 0. ->>>>>>> main Returns: sklearn.model_selection.BaseCrossValidator: Data splitting method. From c084c4dbc83ec6a0d1db37666e33415eb4b0c21b Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Tue, 26 Jan 2021 14:18:30 -0500 Subject: [PATCH 93/98] update tests --- evalml/tests/automl_tests/test_automl.py | 2 +- evalml/tests/component_tests/test_components.py | 16 ++++++++-------- 2 files changed, 9 insertions(+), 9 deletions(-) diff --git a/evalml/tests/automl_tests/test_automl.py b/evalml/tests/automl_tests/test_automl.py index e00d4b8d45..21df31e27b 100644 --- a/evalml/tests/automl_tests/test_automl.py +++ b/evalml/tests/automl_tests/test_automl.py @@ -72,7 +72,7 @@ def test_search_results(X_y_regression, X_y_binary, X_y_multi, automl_type): expected_pipeline_class = MulticlassClassificationPipeline X, y = X_y_multi - automl = AutoMLSearch(X_train=X, y_train=y, problem_type=automl_type, max_iterations=2, n_jobs=1, error_callback=raise_error_callback) + automl = AutoMLSearch(X_train=X, y_train=y, problem_type=automl_type, max_iterations=2, n_jobs=1) automl.search() assert automl.results.keys() == {'pipeline_results', 'search_order', 'errors'} assert automl.results['search_order'] == [0, 1] diff --git a/evalml/tests/component_tests/test_components.py b/evalml/tests/component_tests/test_components.py index 899b2ea949..17e1a77f0e 100644 --- a/evalml/tests/component_tests/test_components.py +++ b/evalml/tests/component_tests/test_components.py @@ -590,13 +590,13 @@ def __init__(self): pass def fit(self, X, y): - pass + return self def predict(self, X): - return pd.Series() + return ww.DataColumn(pd.Series()) def predict_proba(self, X): - return pd.DataFrame() + return ww.DataTable(pd.DataFrame()) class MockEstimator(Estimator): name = "Mock Estimator" @@ -625,7 +625,7 @@ def __init__(self): pass def fit(self, X, y): - pass + return self def transform(self, X, y=None): return ww.DataTable(X) @@ 
-651,19 +651,19 @@ class MockTransformerWithOverride(Transformer): name = "Mock Transformer" def fit(self, X, y): - pass + return self def transform(self, X): - pass + return ww.DataTable(pd.DataFrame()) class MockTransformerWithOverrideSubclass(Transformer): name = "Mock Transformer Subclass" def fit(self, X, y): - pass + return self def transform(self, X): - pass + return ww.DataTable(pd.DataFrame()) X, y = X_y_binary transformer = MockTransformerWithOverride() From a8149f7b1e2a230b8dc39debe8020ed78908636c Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Tue, 26 Jan 2021 14:20:15 -0500 Subject: [PATCH 94/98] test docstr update --- evalml/pipelines/components/ensemble/stacked_ensemble_base.py | 1 + .../pipelines/components/ensemble/stacked_ensemble_classifier.py | 1 + .../pipelines/components/ensemble/stacked_ensemble_regressor.py | 1 + 3 files changed, 3 insertions(+) diff --git a/evalml/pipelines/components/ensemble/stacked_ensemble_base.py b/evalml/pipelines/components/ensemble/stacked_ensemble_base.py index 25b5b713a9..76918d6c04 100644 --- a/evalml/pipelines/components/ensemble/stacked_ensemble_base.py +++ b/evalml/pipelines/components/ensemble/stacked_ensemble_base.py @@ -24,6 +24,7 @@ def __init__(self, input_pipelines=None, final_estimator=None, cv=None, n_jobs=N cv (int, cross-validation generator or an iterable): Determines the cross-validation splitting strategy used to train final_estimator. For int/None inputs, if the estimator is a classifier and y is either binary or multiclass, StratifiedKFold is used. In all other cases, KFold is used. Possible inputs for cv are: + - None: 5-fold cross validation - int: the number of folds in a (Stratified) KFold - An scikit-learn cross-validation generator object diff --git a/evalml/pipelines/components/ensemble/stacked_ensemble_classifier.py b/evalml/pipelines/components/ensemble/stacked_ensemble_classifier.py index 979bca0e4d..df5a46adbb 100644 --- a/evalml/pipelines/components/ensemble/stacked_ensemble_classifier.py +++ b/evalml/pipelines/components/ensemble/stacked_ensemble_classifier.py @@ -29,6 +29,7 @@ def __init__(self, input_pipelines=None, final_estimator=None, cv (int, cross-validation generator or an iterable): Determines the cross-validation splitting strategy used to train final_estimator. For int/None inputs, if the estimator is a classifier and y is either binary or multiclass, StratifiedKFold is used. Defaults to None. Possible inputs for cv are: + - None: 3-fold cross validation - int: the number of folds in a (Stratified) KFold - An scikit-learn cross-validation generator object diff --git a/evalml/pipelines/components/ensemble/stacked_ensemble_regressor.py b/evalml/pipelines/components/ensemble/stacked_ensemble_regressor.py index 54a1460154..730ead472a 100644 --- a/evalml/pipelines/components/ensemble/stacked_ensemble_regressor.py +++ b/evalml/pipelines/components/ensemble/stacked_ensemble_regressor.py @@ -28,6 +28,7 @@ def __init__(self, input_pipelines=None, final_estimator=None, cv (int, cross-validation generator or an iterable): Determines the cross-validation splitting strategy used to train final_estimator. For int/None inputs, KFold is used. Defaults to None. 
Possible inputs for cv are: + - None: 3-fold cross validation - int: the number of folds in a (Stratified) KFold - An scikit-learn cross-validation generator object From bd182e193784a194407f5142136a1783676a5679 Mon Sep 17 00:00:00 2001 From: Angela Lin Date: Tue, 26 Jan 2021 15:30:38 -0500 Subject: [PATCH 95/98] more cleanup, update partial dep impl --- Makefile | 8 ++++---- evalml/model_understanding/graphs.py | 8 -------- .../prediction_explanations/_user_interface.py | 2 +- evalml/objectives/utils.py | 2 +- evalml/pipelines/component_graph.py | 2 +- .../classifiers/baseline_classifier.py | 2 +- .../transformers/encoders/onehot_encoder.py | 2 +- .../feature_selection/feature_selector.py | 4 ++-- evalml/pipelines/components/utils.py | 9 +++++++++ evalml/pipelines/pipeline_base.py | 5 ++--- .../tests/component_tests/test_components.py | 6 ------ .../test_datetime_featurizer.py | 2 +- .../model_understanding_tests/test_graphs.py | 18 ------------------ 13 files changed, 23 insertions(+), 47 deletions(-) diff --git a/Makefile b/Makefile index 4ea75e6802..e14bbc0392 100644 --- a/Makefile +++ b/Makefile @@ -18,19 +18,19 @@ lint-fix: .PHONY: test test: - pytest evalml/ --doctest-modules --doctest-continue-on-failure --durations=0 + pytest evalml/ --doctest-modules --doctest-continue-on-failure .PHONY: circleci-test circleci-test: - pytest evalml/ -n 8 --doctest-modules --cov=evalml --junitxml=test-reports/junit.xml --doctest-continue-on-failure -v --durations=0 + pytest evalml/ -n 8 --doctest-modules --cov=evalml --junitxml=test-reports/junit.xml --doctest-continue-on-failure -v .PHONY: circleci-test-minimal-deps circleci-test-minimal-deps: - pytest evalml/ -n 8 --doctest-modules --cov=evalml --junitxml=test-reports/junit.xml --doctest-continue-on-failure -v --has-minimal-dependencies --durations=0 + pytest evalml/ -n 8 --doctest-modules --cov=evalml --junitxml=test-reports/junit.xml --doctest-continue-on-failure -v --has-minimal-dependencies .PHONY: win-circleci-test win-circleci-test: - pytest evalml/ -n 8 --doctest-modules --cov=evalml --junitxml=test-reports/junit.xml --doctest-continue-on-failure -v --durations=0 + pytest evalml/ -n 8 --doctest-modules --cov=evalml --junitxml=test-reports/junit.xml --doctest-continue-on-failure -v .PHONY: installdeps installdeps: diff --git a/evalml/model_understanding/graphs.py b/evalml/model_understanding/graphs.py index bfffbbae44..541aa5c1bc 100644 --- a/evalml/model_understanding/graphs.py +++ b/evalml/model_understanding/graphs.py @@ -488,14 +488,6 @@ def partial_dependence(pipeline, X, features, grid_resolution=100): warnings.warn("There are null values in the features, which will cause NaN values in the partial dependence output. 
Fill in these values to remove the NaN values.", NullsInColumnWarning)
     wrapped = evalml.pipelines.components.utils.scikit_learn_wrapped_estimator(pipeline)
-    if isinstance(pipeline, evalml.pipelines.ClassificationPipeline):
-        wrapped._estimator_type = "classifier"
-        wrapped.classes_ = pipeline.classes_
-    elif isinstance(pipeline, evalml.pipelines.RegressionPipeline):
-        wrapped._estimator_type = "regressor"
-        wrapped.feature_importances_ = pipeline.feature_importance
-    wrapped._is_fitted = True
-
     avg_pred, values = sk_partial_dependence(wrapped, X=X, features=features, grid_resolution=grid_resolution)

     classes = None
diff --git a/evalml/model_understanding/prediction_explanations/_user_interface.py b/evalml/model_understanding/prediction_explanations/_user_interface.py
index d12d67ee06..b66556e6b1 100644
--- a/evalml/model_understanding/prediction_explanations/_user_interface.py
+++ b/evalml/model_understanding/prediction_explanations/_user_interface.py
@@ -23,7 +23,7 @@ def _make_rows(shap_values, normalized_values, pipeline_features, top_k, include
         convert_numeric_to_string (bool): Whether numeric values should be converted to strings from numeric

     Returns:
-        list(str)
+        list[str]
     """
     tuples = [(value[0], feature_name) for feature_name, value in normalized_values.items()]
diff --git a/evalml/objectives/utils.py b/evalml/objectives/utils.py
index 34f0abfc2f..4068c1d4c0 100644
--- a/evalml/objectives/utils.py
+++ b/evalml/objectives/utils.py
@@ -46,7 +46,7 @@ def get_core_objective_names():
     """Get a list of all valid core objectives.

     Returns:
-        list(str): Objective names.
+        list[str]: Objective names.
     """
     all_objectives = _all_objectives_dict()
     non_core = get_non_core_objectives()
diff --git a/evalml/pipelines/component_graph.py b/evalml/pipelines/component_graph.py
index d2e0a25c38..342e7e3f49 100644
--- a/evalml/pipelines/component_graph.py
+++ b/evalml/pipelines/component_graph.py
@@ -298,7 +298,7 @@ def get_parents(self, component_name):
             component_name (str): Name of the child component to look up

         Returns:
-            list(str): Iterator of parent component names
+            list[str]: Iterator of parent component names
         """
         try:
             component_info = self.component_dict[component_name]
diff --git a/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py b/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py
index 74bc45ec4c..ef566999fd 100644
--- a/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py
+++ b/evalml/pipelines/components/estimators/classifiers/baseline_classifier.py
@@ -97,6 +97,6 @@ def classes_(self):
         """Returns class labels. Will return None before fitting.

         Returns:
-            list(str) or list(float) : Class names
+            list[str] or list[float]: Class names
         """
         return self._classes
diff --git a/evalml/pipelines/components/transformers/encoders/onehot_encoder.py b/evalml/pipelines/components/transformers/encoders/onehot_encoder.py
index 6bdcada66d..02f5313ebd 100644
--- a/evalml/pipelines/components/transformers/encoders/onehot_encoder.py
+++ b/evalml/pipelines/components/transformers/encoders/onehot_encoder.py
@@ -34,7 +34,7 @@ def __init__(self,
         Arguments:
             top_n (int): Number of categories per column to encode. If None, all categories will be encoded. Otherwise, the `n` most frequent will be encoded and all others will be dropped. Defaults to 10.
-            features_to_encode (list(str)): List of columns to encode. All other columns will remain untouched.
+            features_to_encode (list[str]): List of columns to encode. All other columns will remain untouched.
If None, all appropriate columns will be encoded. Defaults to None. categories (list): A two dimensional list of categories, where `categories[i]` is a list of the categories for the column at index `i`. This can also be `None`, or `"auto"` if `top_n` is not None. Defaults to None. diff --git a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py index e3086fdd1a..2b15c8c3d9 100644 --- a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py +++ b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py @@ -14,7 +14,7 @@ def get_names(self): """Get names of selected features. Returns: - List of the names of features selected + list[str]: List of the names of features selected """ selected_masks = self._component_obj.get_support() return [feature_name for (selected, feature_name) in zip(selected_masks, self.input_feature_names) if selected] @@ -23,7 +23,7 @@ def transform(self, X, y=None): """Transforms input data by selecting features. Arguments: - X (ww.DataTable, pd.DataFrame): Data to transform + X (ww.DataTable, pd.DataFrame): Data to transform. y (ww.DataColumn, pd.Series, optional): Target data. Ignored. Returns: diff --git a/evalml/pipelines/components/utils.py b/evalml/pipelines/components/utils.py index 281c7df287..1877352e5a 100644 --- a/evalml/pipelines/components/utils.py +++ b/evalml/pipelines/components/utils.py @@ -122,6 +122,11 @@ def __init__(self, pipeline): pipeline (PipelineBase or subclass obj): EvalML pipeline """ self.pipeline = pipeline + self._estimator_type = "classifier" + if pipeline._is_fitted: + self.feature_importances_ = pipeline.feature_importance + self._is_fitted = True + self.classes_ = pipeline.classes_ def fit(self, X, y): """Fits component to data @@ -176,6 +181,10 @@ def __init__(self, pipeline): pipeline (PipelineBase or subclass obj): EvalML pipeline """ self.pipeline = pipeline + self._estimator_type = "regressor" + if pipeline._is_fitted: + self.feature_importances_ = pipeline.feature_importance + self._is_fitted = True def fit(self, X, y): """Fits component to data diff --git a/evalml/pipelines/pipeline_base.py b/evalml/pipelines/pipeline_base.py index e1cd5b9c1e..674f504b09 100644 --- a/evalml/pipelines/pipeline_base.py +++ b/evalml/pipelines/pipeline_base.py @@ -112,8 +112,7 @@ def summary(cls): @classproperty def linearized_component_graph(cls): - """Returns a component graph in list form. Note: this is not guaranteed to be in proper component computation order - """ + """Returns a component graph in list form. Note: this is not guaranteed to be in proper component computation order""" if isinstance(cls.component_graph, list): return cls.component_graph else: @@ -253,7 +252,7 @@ def _score_all_objectives(self, X, y, y_pred, y_pred_proba, objectives): objectives (list): List of objectives to score. Returns: - Ordered dictionary with objectives and their scores. + dict: Ordered dictionary with objectives and their scores. 
""" scored_successfully = OrderedDict() exceptions = OrderedDict() diff --git a/evalml/tests/component_tests/test_components.py b/evalml/tests/component_tests/test_components.py index 17e1a77f0e..ad6740de3c 100644 --- a/evalml/tests/component_tests/test_components.py +++ b/evalml/tests/component_tests/test_components.py @@ -535,15 +535,12 @@ def test_transformer_transform_output_type(X_y_binary): if isinstance(component, SelectColumns): assert transform_output.shape == (X.shape[0], 0) - assert isinstance(transform_output.to_dataframe().columns, pd.Index) elif isinstance(component, PCA) or isinstance(component, LinearDiscriminantAnalysis): assert transform_output.shape[0] == X.shape[0] assert transform_output.shape[1] <= X.shape[1] - assert isinstance(transform_output.to_dataframe().columns, pd.Index) elif isinstance(component, DFSTransformer): assert transform_output.shape[0] == X.shape[0] assert transform_output.shape[1] >= X.shape[1] - assert isinstance(transform_output.to_dataframe().columns, pd.Index) elif isinstance(component, DelayedFeatureTransformer): # We just want to check that DelayedFeaturesTransformer outputs a DataFrame # The dataframe shape and index are checked in test_delayed_features_transformer.py @@ -557,15 +554,12 @@ def test_transformer_transform_output_type(X_y_binary): if isinstance(component, SelectColumns): assert transform_output.shape == (X.shape[0], 0) - assert isinstance(transform_output.to_dataframe().columns, pd.Index) elif isinstance(component, PCA) or isinstance(component, LinearDiscriminantAnalysis): assert transform_output.shape[0] == X.shape[0] assert transform_output.shape[1] <= X.shape[1] - assert isinstance(transform_output.to_dataframe().columns, pd.Index) elif isinstance(component, DFSTransformer): assert transform_output.shape[0] == X.shape[0] assert transform_output.shape[1] >= X.shape[1] - assert isinstance(transform_output.to_dataframe().columns, pd.Index) else: assert transform_output.shape == X.shape assert (list(transform_output.columns) == list(X_cols_expected)) diff --git a/evalml/tests/component_tests/test_datetime_featurizer.py b/evalml/tests/component_tests/test_datetime_featurizer.py index 67c6550635..0a1a5b4c3c 100644 --- a/evalml/tests/component_tests/test_datetime_featurizer.py +++ b/evalml/tests/component_tests/test_datetime_featurizer.py @@ -105,7 +105,7 @@ def test_datetime_featurizer_no_features_to_extract(): datetime_transformer = DateTimeFeaturizer(features_to_extract=[]) rng = pd.date_range('2020-02-24', periods=20, freq='D') X = pd.DataFrame({"date col": rng, "numerical": [0] * len(rng)}) - expected = pd.DataFrame({"date col": rng, "numerical": [0] * len(rng)}) + expected = X.copy() expected["numerical"] = expected["numerical"].astype("Int64") datetime_transformer.fit(X) transformed = datetime_transformer.transform(X).to_dataframe() diff --git a/evalml/tests/model_understanding_tests/test_graphs.py b/evalml/tests/model_understanding_tests/test_graphs.py index 4ae120ab66..6edbfeb0a8 100644 --- a/evalml/tests/model_understanding_tests/test_graphs.py +++ b/evalml/tests/model_understanding_tests/test_graphs.py @@ -743,24 +743,6 @@ def test_partial_dependence_problem_types(data_type, problem_type, X_y_binary, X part_dep = partial_dependence(pipeline, X, features=0, grid_resolution=20) check_partial_dependence_dataframe(pipeline, part_dep) assert not part_dep.isnull().any(axis=None) - with pytest.raises(AttributeError): - pipeline._estimator_type - with pytest.raises(AttributeError): - pipeline.feature_importances_ - - 
-@patch('evalml.model_understanding.graphs.sk_partial_dependence')
-def test_partial_dependence_error_still_deletes_attributes(mock_part_dep, X_y_binary, logistic_regression_binary_pipeline_class):
-    X, y = X_y_binary
-    pipeline = logistic_regression_binary_pipeline_class(parameters={"Logistic Regression Classifier": {"n_jobs": 1}})
-    pipeline.fit(X, y)
-    mock_part_dep.side_effect = Exception()
-    with pytest.raises(Exception):
-        partial_dependence(pipeline, X, features=0, grid_resolution=20)
-    with pytest.raises(AttributeError):
-        pipeline._estimator_type
-    with pytest.raises(AttributeError):
-        pipeline.feature_importances_


 def test_partial_dependence_string_feature_name(logistic_regression_binary_pipeline_class):

From 11dd1af984a5d6bf2b37f15c0d7333db26edf3d8 Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Tue, 26 Jan 2021 15:57:55 -0500
Subject: [PATCH 96/98] some more cleanup of feature selector and baseline
 tests

---
 .../feature_selection/feature_selector.py     |  5 +-
 .../delayed_feature_transformer.py            |  4 +-
 .../components/transformers/transformer.py    |  6 +--
 .../test_baseline_classifier.py               | 44 ++++++++++-------
 .../test_baseline_regressor.py                |  7 ++-
 .../component_tests/test_feature_selectors.py | 23 ++++++++-
 .../test_baseline_classification.py           | 48 +++++++++----------
 .../test_baseline_regression.py               |  7 ++-
 8 files changed, 91 insertions(+), 53 deletions(-)

diff --git a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py
index 2b15c8c3d9..8d38da397f 100644
--- a/evalml/pipelines/components/transformers/feature_selection/feature_selector.py
+++ b/evalml/pipelines/components/transformers/feature_selection/feature_selector.py
@@ -1,5 +1,6 @@
 import pandas as pd

+from evalml.exceptions import MethodPropertyNotFoundError
 from evalml.pipelines.components.transformers import Transformer
 from evalml.utils.gen_utils import (
     _convert_to_woodwork_structure,
@@ -20,7 +21,7 @@ def get_names(self):
         return [feature_name for (selected, feature_name) in zip(selected_masks, self.input_feature_names) if selected]

     def transform(self, X, y=None):
-        """Transforms input data by selecting features.
+        """Transforms input data by selecting features. If the component_obj does not have a transform method, will raise a MethodPropertyNotFoundError exception.

         Arguments:
             X (ww.DataTable, pd.DataFrame): Data to transform.
@@ -36,7 +37,7 @@ def transform(self, X, y=None):
         try:
             X_t = self._component_obj.transform(X)
         except AttributeError:
-            raise RuntimeError("Feature selector requires a transform method or a component_obj that implements transform")
+            raise MethodPropertyNotFoundError("Feature selector requires a transform method or a component_obj that implements transform")
         X_dtypes = X.dtypes.to_dict()
         selected_col_names = self.get_names()
diff --git a/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py b/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py
index 11bafb04d9..daa3d381e9 100644
--- a/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py
+++ b/evalml/pipelines/components/transformers/preprocessing/delayed_feature_transformer.py
@@ -45,8 +45,8 @@ def fit(self, X, y=None):
         """Fits the DelayFeatureTransformer.
Arguments: - X (ww.DataTable, pd.DataFrame or np.ndarray): the input training data of shape [n_samples, n_features] - y (ww.DataColumn, pd.Series, optional): the target training data of length [n_samples] + X (ww.DataTable, pd.DataFrame or np.ndarray): The input training data of shape [n_samples, n_features] + y (ww.DataColumn, pd.Series, optional): The target training data of length [n_samples] Returns: self diff --git a/evalml/pipelines/components/transformers/transformer.py b/evalml/pipelines/components/transformers/transformer.py index ead4c3a5ed..cd2b4cf9c6 100644 --- a/evalml/pipelines/components/transformers/transformer.py +++ b/evalml/pipelines/components/transformers/transformer.py @@ -25,11 +25,11 @@ class Transformer(ComponentBase): model_family = ModelFamily.NONE def transform(self, X, y=None): - """Transforms data X + """Transforms data X. Arguments: - X (ww.DataTable, pd.DataFrame): Data to transform - y (ww.DataColumn, pd.Series, optional): Target data + X (ww.DataTable, pd.DataFrame): Data to transform. + y (ww.DataColumn, pd.Series, optional): Target data. Returns: ww.DataTable: Transformed X diff --git a/evalml/tests/component_tests/test_baseline_classifier.py b/evalml/tests/component_tests/test_baseline_classifier.py index ceca215d0c..cab3fecba6 100644 --- a/evalml/tests/component_tests/test_baseline_classifier.py +++ b/evalml/tests/component_tests/test_baseline_classifier.py @@ -37,13 +37,14 @@ def test_baseline_binary_mode(data_type, make_data_type): fitted = clf.fit(X, y) assert isinstance(fitted, BaselineClassifier) assert clf.classes_ == [10, 11] + expected_predictions = pd.Series(np.array([10] * X.shape[0]), dtype="Int64") predictions = clf.predict(X) - assert_series_equal(pd.Series(np.array([10] * X.shape[0]), dtype="Int64"), predictions.to_series()) + assert_series_equal(expected_predictions, predictions.to_series()) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (X.shape[0], 2) - expected_predicted_proba = pd.DataFrame({10: [1., 1., 1., 1.], 11: [0., 0., 0., 0.]}) - assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + expected_predictions_proba = pd.DataFrame({10: [1., 1., 1., 1.], 11: [0., 0., 0., 0.]}) + assert_frame_equal(expected_predictions_proba, predicted_proba.to_dataframe()) np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -55,13 +56,14 @@ def test_baseline_binary_random(X_y_binary): clf.fit(X, y) assert clf.classes_ == [0, 1] + expected_predictions = pd.Series(get_random_state(0).choice(np.unique(y), len(X)), dtype="Int64") predictions = clf.predict(X) - assert_series_equal(pd.Series(get_random_state(0).choice(np.unique(y), len(X)), dtype="Int64"), predictions.to_series()) + assert_series_equal(expected_predictions, predictions.to_series()) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 2) - expected_predicted_proba = pd.DataFrame(np.array([[0.5 for i in range(len(values))]] * len(X))) - assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + expected_predictions_proba = pd.DataFrame(np.array([[0.5 for i in range(len(values))]] * len(X))) + assert_frame_equal(expected_predictions_proba, predicted_proba.to_dataframe()) np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -71,16 +73,19 @@ def test_baseline_binary_random_weighted(X_y_binary): values, counts = np.unique(y, return_counts=True) percent_freq = counts.astype(float) / len(y) assert percent_freq.sum() == 1.0 + clf = 
BaselineClassifier(strategy="random_weighted", random_state=0) clf.fit(X, y) + assert clf.classes_ == [0, 1] + expected_predictions = pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64") predictions = clf.predict(X) - assert_series_equal(pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64"), predictions.to_series()) + assert_series_equal(expected_predictions, predictions.to_series()) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 2) - expected_predicted_proba = pd.DataFrame(np.array([[percent_freq[i] for i in range(len(values))]] * len(X))) - assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + expected_predictions_proba = pd.DataFrame(np.array([[percent_freq[i] for i in range(len(values))]] * len(X))) + assert_frame_equal(expected_predictions_proba, predicted_proba.to_dataframe()) np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -90,14 +95,16 @@ def test_baseline_multiclass_mode(): y = pd.Series([10, 12, 11, 11]) clf = BaselineClassifier(strategy="mode") clf.fit(X, y) + assert clf.classes_ == [10, 11, 12] predictions = clf.predict(X) - assert_series_equal(pd.Series(np.array([11] * len(X)), dtype="Int64"), predictions.to_series()) + expected_predictions = pd.Series([11] * len(X), dtype="Int64") + assert_series_equal(expected_predictions, predictions.to_series()) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) - expected_predicted_proba = pd.DataFrame({10: [0., 0., 0., 0.], 11: [1., 1., 1., 1.], 12: [0., 0., 0., 0.]}) - assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + expected_predictions_proba = pd.DataFrame({10: [0., 0., 0., 0.], 11: [1., 1., 1., 1.], 12: [0., 0., 0., 0.]}) + assert_frame_equal(expected_predictions_proba, predicted_proba.to_dataframe()) np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -107,9 +114,11 @@ def test_baseline_multiclass_random(X_y_multi): values = np.unique(y) clf = BaselineClassifier(strategy="random", random_state=0) clf.fit(X, y) + assert clf.classes_ == [0, 1, 2] + expected_predictions = pd.Series(get_random_state(0).choice(np.unique(y), len(X)), dtype="Int64") predictions = clf.predict(X) - assert_series_equal(pd.Series(get_random_state(0).choice(np.unique(y), len(X)), dtype="Int64"), predictions.to_series()) + assert_series_equal(expected_predictions, predictions.to_series()) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) @@ -124,10 +133,11 @@ def test_baseline_multiclass_random_weighted(X_y_multi): assert percent_freq.sum() == 1.0 clf = BaselineClassifier(strategy="random_weighted", random_state=0) clf.fit(X, y) - assert clf.classes_ == [0, 1, 2] + assert clf.classes_ == [0, 1, 2] + expected_predictions = pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64") predictions = clf.predict(X) - assert_series_equal(pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64"), predictions.to_series()) + assert_series_equal(expected_predictions, predictions.to_series()) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) @@ -141,9 +151,11 @@ def test_baseline_no_mode(): y = pd.Series([1, 0, 2, 0, 1]) clf = BaselineClassifier() clf.fit(X, y) + assert clf.classes_ == [0, 1, 2] + expected_predictions = pd.Series([0] * len(X), dtype="Int64") predictions = clf.predict(X) - 
assert_series_equal(pd.Series([0] * len(X), dtype="Int64"), predictions.to_series()) + assert_series_equal(expected_predictions, predictions.to_series()) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) diff --git a/evalml/tests/component_tests/test_baseline_regressor.py b/evalml/tests/component_tests/test_baseline_regressor.py index 8a71cc3aab..d28fb70523 100644 --- a/evalml/tests/component_tests/test_baseline_regressor.py +++ b/evalml/tests/component_tests/test_baseline_regressor.py @@ -32,8 +32,9 @@ def test_baseline_mean(X_y_regression): fitted = clf.fit(X, y) assert isinstance(fitted, BaselineRegressor) + expected_predictions = pd.Series([mean] * len(X)) predictions = clf.predict(X) - assert_series_equal(pd.Series([mean] * len(X)), predictions.to_series()) + assert_series_equal(expected_predictions, predictions.to_series()) np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) @@ -42,6 +43,8 @@ def test_baseline_median(X_y_regression): median = np.median(y) clf = BaselineRegressor(strategy="median") clf.fit(X, y) + + expected_predictions = pd.Series([median] * len(X)) predictions = clf.predict(X) - assert_series_equal(pd.Series([median] * len(X)), predictions.to_series()) + assert_series_equal(expected_predictions, predictions.to_series()) np.testing.assert_allclose(clf.feature_importance, np.array([0.0] * X.shape[1])) diff --git a/evalml/tests/component_tests/test_feature_selectors.py b/evalml/tests/component_tests/test_feature_selectors.py index 02187bb145..5b9a552d1e 100644 --- a/evalml/tests/component_tests/test_feature_selectors.py +++ b/evalml/tests/component_tests/test_feature_selectors.py @@ -1,6 +1,7 @@ import pandas as pd import pytest +from evalml.exceptions import MethodPropertyNotFoundError from evalml.pipelines.components import ( ComponentBase, FeatureSelector, @@ -53,7 +54,25 @@ def fit(self, X, y): mock_feature_selector = MockFeatureSelector() mock_feature_selector.fit(pd.DataFrame(), pd.Series()) - with pytest.raises(RuntimeError, match="Feature selector requires a transform method or a component_obj that implements transform"): + with pytest.raises(MethodPropertyNotFoundError, match="Feature selector requires a transform method or a component_obj that implements transform"): mock_feature_selector.transform(pd.DataFrame()) - with pytest.raises(RuntimeError, match="Feature selector requires a transform method or a component_obj that implements transform"): + with pytest.raises(MethodPropertyNotFoundError, match="Feature selector requires a transform method or a component_obj that implements transform"): + mock_feature_selector.fit_transform(pd.DataFrame()) + + +def test_feature_selector_component_obj_missing_transform(): + class MockFeatureSelector(FeatureSelector): + name = "Mock Feature Selector" + + def __init__(self): + self._component_obj = None + + def fit(self, X, y): + return self + + mock_feature_selector = MockFeatureSelector() + mock_feature_selector.fit(pd.DataFrame(), pd.Series()) + with pytest.raises(MethodPropertyNotFoundError, match="Feature selector requires a transform method or a component_obj that implements transform"): + mock_feature_selector.transform(pd.DataFrame()) + with pytest.raises(MethodPropertyNotFoundError, match="Feature selector requires a transform method or a component_obj that implements transform"): mock_feature_selector.fit_transform(pd.DataFrame()) diff --git a/evalml/tests/pipeline_tests/classification_pipeline_tests/test_baseline_classification.py 
b/evalml/tests/pipeline_tests/classification_pipeline_tests/test_baseline_classification.py index 36b80aa91d..f9adf37389 100644 --- a/evalml/tests/pipeline_tests/classification_pipeline_tests/test_baseline_classification.py +++ b/evalml/tests/pipeline_tests/classification_pipeline_tests/test_baseline_classification.py @@ -16,13 +16,13 @@ def test_baseline_binary_random(X_y_binary): } clf = BaselineBinaryPipeline(parameters=parameters) clf.fit(X, y) - expected_predicted = pd.Series(get_random_state(0).choice(np.unique(y), len(X)), dtype="Int64") - assert_series_equal(expected_predicted, clf.predict(X).to_series()) + expected_predictions = pd.Series(get_random_state(0).choice(np.unique(y), len(X)), dtype="Int64") + assert_series_equal(expected_predictions, clf.predict(X).to_series()) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 2) - expected_predicted_proba = pd.DataFrame(np.array([[0.5 for i in range(len(values))]] * len(X))) - assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + expected_predictions_proba = pd.DataFrame(np.array([[0.5 for i in range(len(values))]] * len(X))) + assert_frame_equal(expected_predictions_proba, predicted_proba.to_dataframe()) np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) @@ -41,13 +41,13 @@ def test_baseline_binary_random_weighted(X_y_binary): clf = BaselineBinaryPipeline(parameters=parameters) clf.fit(X, y) - expected_predicted = pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64") - assert_series_equal(expected_predicted, clf.predict(X).to_series()) + expected_predictions = pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64") + assert_series_equal(expected_predictions, clf.predict(X).to_series()) - expected_predicted_proba = pd.DataFrame(np.array([[percent_freq[i] for i in range(len(values))]] * len(X))) + expected_predictions_proba = pd.DataFrame(np.array([[percent_freq[i] for i in range(len(values))]] * len(X))) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 2) - assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + assert_frame_equal(expected_predictions_proba, predicted_proba.to_dataframe()) np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) @@ -63,13 +63,13 @@ def test_baseline_binary_mode(): clf = BaselineBinaryPipeline(parameters=parameters) clf.fit(X, y) - expected_predicted = pd.Series(np.array([10] * len(X)), dtype="Int64") - assert_series_equal(expected_predicted, clf.predict(X).to_series()) + expected_predictions = pd.Series(np.array([10] * len(X)), dtype="Int64") + assert_series_equal(expected_predictions, clf.predict(X).to_series()) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 2) - expected_predicted_proba = pd.DataFrame({10: [1., 1., 1., 1.], 11: [0., 0., 0., 0.]}) - assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + expected_predictions_proba = pd.DataFrame({10: [1., 1., 1., 1.], 11: [0., 0., 0., 0.]}) + assert_frame_equal(expected_predictions_proba, predicted_proba.to_dataframe()) np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) @@ -85,13 +85,13 @@ def test_baseline_multi_random(X_y_multi): clf = BaselineMulticlassPipeline(parameters=parameters) clf.fit(X, y) - expected_predicted = pd.Series(get_random_state(0).choice(np.unique(y), len(X)), dtype="Int64") - 
assert_series_equal(expected_predicted, clf.predict(X).to_series()) + expected_predictions = pd.Series(get_random_state(0).choice(np.unique(y), len(X)), dtype="Int64") + assert_series_equal(expected_predictions, clf.predict(X).to_series()) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) - expected_predicted_proba = pd.DataFrame(np.array([[1. / 3 for i in range(len(values))]] * len(X))) - assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + expected_predictions_proba = pd.DataFrame(np.array([[1. / 3 for i in range(len(values))]] * len(X))) + assert_frame_equal(expected_predictions_proba, predicted_proba.to_dataframe()) np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) @@ -109,13 +109,13 @@ def test_baseline_multi_random_weighted(X_y_multi): clf = BaselineMulticlassPipeline(parameters=parameters) clf.fit(X, y) - expected_predicted = pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64") - assert_series_equal(expected_predicted, clf.predict(X).to_series()) + expected_predictions = pd.Series(get_random_state(0).choice(np.unique(y), len(X), p=percent_freq), dtype="Int64") + assert_series_equal(expected_predictions, clf.predict(X).to_series()) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) - expected_predicted_proba = pd.DataFrame(np.array([[percent_freq[i] for i in range(len(values))]] * len(X))) - assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + expected_predictions_proba = pd.DataFrame(np.array([[percent_freq[i] for i in range(len(values))]] * len(X))) + assert_frame_equal(expected_predictions_proba, predicted_proba.to_dataframe()) np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) @@ -130,12 +130,12 @@ def test_baseline_multi_mode(): } clf = BaselineMulticlassPipeline(parameters=parameters) clf.fit(X, y) - expected_predicted = pd.Series(np.array([11] * len(X)), dtype="Int64") - assert_series_equal(expected_predicted, clf.predict(X).to_series()) + expected_predictions = pd.Series(np.array([11] * len(X)), dtype="Int64") + assert_series_equal(expected_predictions, clf.predict(X).to_series()) predicted_proba = clf.predict_proba(X) assert predicted_proba.shape == (len(X), 3) - expected_predicted_proba = pd.DataFrame({10: [0., 0., 0., 0.], 11: [1., 1., 1., 1.], 12: [0., 0., 0., 0.]}) - assert_frame_equal(expected_predicted_proba, predicted_proba.to_dataframe()) + expected_predictions_proba = pd.DataFrame({10: [0., 0., 0., 0.], 11: [1., 1., 1., 1.], 12: [0., 0., 0., 0.]}) + assert_frame_equal(expected_predictions_proba, predicted_proba.to_dataframe()) np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1])) diff --git a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_baseline_regression.py b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_baseline_regression.py index 1eaf3ccef4..4750a45316 100644 --- a/evalml/tests/pipeline_tests/regression_pipeline_tests/test_baseline_regression.py +++ b/evalml/tests/pipeline_tests/regression_pipeline_tests/test_baseline_regression.py @@ -15,8 +15,10 @@ def test_baseline_mean(X_y_regression): } clf = BaselineRegressionPipeline(parameters=parameters) clf.fit(X, y) + + expected_predictions = pd.Series([mean] * len(X)) predictions = clf.predict(X) - assert_series_equal(pd.Series([mean] * len(X)), predictions.to_series()) + assert_series_equal(expected_predictions, 
     np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1]))
 
 
@@ -30,6 +32,7 @@ def test_baseline_median(X_y_regression):
     }
     clf = BaselineRegressionPipeline(parameters=parameters)
     clf.fit(X, y)
+    expected_predictions = pd.Series([median] * len(X))
     predictions = clf.predict(X)
-    assert_series_equal(pd.Series([median] * len(X)), predictions.to_series())
+    assert_series_equal(expected_predictions, predictions.to_series())
     np.testing.assert_allclose(clf.feature_importance.iloc[:, 1], np.array([0.0] * X.shape[1]))

From 8692830530b8c50d881e9be3003ed23b91979919 Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Tue, 26 Jan 2021 16:19:04 -0500
Subject: [PATCH 97/98] clean up components notebook

---
 docs/source/user_guide/components.ipynb | 154 ++++++------------------
 1 file changed, 39 insertions(+), 115 deletions(-)

diff --git a/docs/source/user_guide/components.ipynb b/docs/source/user_guide/components.ipynb
index b7cc3af7a6..59c970592b 100644
--- a/docs/source/user_guide/components.ipynb
+++ b/docs/source/user_guide/components.ipynb
@@ -148,8 +148,11 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "import pandas as pd\n",
     "from evalml.pipelines.components import Transformer\n",
+    "from evalml.utils.gen_utils import (\n",
+    "    _convert_to_woodwork_structure,\n",
+    "    _convert_woodwork_types_wrapper\n",
+    ")\n",
     "\n",
     "class DropNullColumns(Transformer):\n",
     "    \"\"\"Transformer to drop features whose percentage of NaN values exceeds a specified threshold\"\"\"\n",
@@ -175,10 +178,19 @@
     "                         random_state=random_state)\n",
     "\n",
     "    def fit(self, X, y=None):\n",
+    "        \"\"\"Fits DropNullColumns component to data\n",
+    "\n",
+    "        Arguments:\n",
+    "            X (list, ww.DataTable, pd.DataFrame): The input training data of shape [n_samples, n_features]\n",
+    "            y (list, ww.DataColumn, pd.Series, np.ndarray, optional): The target training data of length [n_samples]\n",
+    "\n",
+    "        Returns:\n",
+    "            self\n",
+    "        \"\"\"\n",
     "        pct_null_threshold = self.parameters[\"pct_null_threshold\"]\n",
-    "        if not isinstance(X, pd.DataFrame):\n",
-    "            X = pd.DataFrame(X)\n",
-    "        percent_null = X.isnull().mean()\n",
+    "        X_t = _convert_to_woodwork_structure(X)\n",
+    "        X_t = _convert_woodwork_types_wrapper(X_t.to_dataframe())\n",
+    "        percent_null = X_t.isnull().mean()\n",
     "        if pct_null_threshold == 0.0:\n",
     "            null_cols = percent_null[percent_null > 0]\n",
     "        else:\n",
@@ -188,16 +200,16 @@
     "\n",
     "    def transform(self, X, y=None):\n",
     "        \"\"\"Transforms data X by dropping columns that exceed the threshold of null values.\n",
+    "\n",
     "        Arguments:\n",
-    "            X (pd.DataFrame): Data to transform\n",
-    "            y (pd.Series, optional): Targets\n",
+    "            X (ww.DataTable, pd.DataFrame): Data to transform\n",
+    "            y (ww.DataColumn, pd.Series, optional): Ignored.\n",
+    "\n",
     "        Returns:\n",
-    "            pd.DataFrame: Transformed X\n",
+    "            ww.DataTable: Transformed X\n",
     "        \"\"\"\n",
-    "\n",
-    "        if not isinstance(X, pd.DataFrame):\n",
-    "            X = pd.DataFrame(X)\n",
-    "        return X.drop(columns=self._cols_to_drop, axis=1)"
+    "        X_t = _convert_to_woodwork_structure(X)\n",
+    "        return X_t.drop(self._cols_to_drop)"
    ]
   },
  {
@@ -214,9 +226,9 @@
    "\n",
    "- `__init__()` - the `__init__()` method of your transformer will need to call `super().__init__()` and pass three parameters in: a `parameters` dictionary holding the parameters to the component, the `component_obj`, and the `random_state` value. You can see that `component_obj` is set to `None` above and we will discuss `component_obj` in depth later on.\n",
    "\n",
-    "- `fit()` - the `fit()` method is responsible for fitting your component on training data.\n",
+    "- `fit()` - the `fit()` method is responsible for fitting your component on training data. It should return the component object.\n",
    "\n",
-    "- `transform()` - after fitting a component, the `transform()` method will take in new data and transform accordingly. Note: a component must call `fit()` before `transform()`.\n",
+    "- `transform()` - after fitting a component, the `transform()` method will take in new data and transform accordingly. It should return a Woodwork DataTable. Note: a component must call `fit()` before `transform()`.\n",
    "\n",
    "You can also call or override `fit_transform()` that combines `fit()` and `transform()` into one method."
   ]
@@ -252,14 +264,14 @@
    "    name = \"Baseline Regressor\"\n",
    "    hyperparameter_ranges = {}\n",
    "    model_family = ModelFamily.BASELINE\n",
-    "    supported_problem_types = [ProblemTypes.REGRESSION]\n",
+    "    supported_problem_types = [ProblemTypes.REGRESSION, ProblemTypes.TIME_SERIES_REGRESSION]\n",
    "\n",
    "    def __init__(self, strategy=\"mean\", random_state=0, **kwargs):\n",
    "        \"\"\"Baseline regressor that uses a simple strategy to make predictions.\n",
    "\n",
    "        Arguments:\n",
-    "            strategy (str): Method used to predict. Valid options are \"mean\", \"median\". Defaults to \"mean\".\n",
-    "            random_state (int): Seed for the random number generator\n",
+    "            strategy (str): method used to predict. Valid options are \"mean\", \"median\". Defaults to \"mean\".\n",
+    "            random_state (int): Seed for the random number generator. Defaults to 0.\n",
    "\n",
    "        \"\"\"\n",
    "        if strategy not in [\"mean\", \"median\"]:\n",
@@ -276,9 +288,9 @@
    "    def fit(self, X, y=None):\n",
    "        if y is None:\n",
    "            raise ValueError(\"Cannot fit Baseline regressor if y is None\")\n",
-    "\n",
-    "        if not isinstance(y, pd.Series):\n",
-    "            y = pd.Series(y)\n",
+    "        X = _convert_to_woodwork_structure(X)\n",
+    "        y = _convert_to_woodwork_structure(y)\n",
+    "        y = _convert_woodwork_types_wrapper(y.to_series())\n",
    "\n",
    "        if self.parameters[\"strategy\"] == \"mean\":\n",
    "            self._prediction_value = y.mean()\n",
@@ -288,17 +300,19 @@
    "        return self\n",
    "\n",
    "    def predict(self, X):\n",
-    "        return pd.Series([self._prediction_value] * len(X))\n",
+    "        X = _convert_to_woodwork_structure(X)\n",
+    "        predictions = pd.Series([self._prediction_value] * len(X))\n",
+    "        return _convert_to_woodwork_structure(predictions)\n",
    "\n",
    "    @property\n",
    "    def feature_importance(self):\n",
    "        \"\"\"Returns importance associated with each feature. Since baseline regressors do not use input features to calculate predictions, returns an array of zeroes.\n",
    "\n",
    "        Returns:\n",
-    "            np.ndarray (float): An array of zeroes\n",
+    "            np.ndarray (float): an array of zeroes\n",
    "\n",
    "        \"\"\"\n",
-    "        return np.zeros(self._num_features)"
+    "        return np.zeros(self._num_features)\n"
    ]
   },
  {
@@ -402,45 +416,6 @@
    "AutoML will perform a search over the allowed ranges for each parameter to select models which produce optimal performance within those ranges. AutoML gets the allowed ranges for each component from the component's `hyperparameter_ranges` class attribute. Any component parameter you add an entry for in `hyperparameter_ranges` will be included in the AutoML search. If parameters are omitted, AutoML will use the default value in all pipelines."
" ] }, - { - "cell_type": "code", - "execution_count": null, - "metadata": {}, - "outputs": [], - "source": [ - "from sklearn.linear_model import LinearRegression as SKLinearRegression\n", - "\n", - "from evalml.model_family import ModelFamily\n", - "from evalml.pipelines.components.estimators import Estimator\n", - "from evalml.problem_types import ProblemTypes\n", - "\n", - "class LinearRegressor(Estimator):\n", - " \"\"\"Linear Regressor.\"\"\"\n", - " name = \"Linear Regressor\"\n", - " hyperparameter_ranges = {\n", - " 'fit_intercept': [True, False],\n", - " 'normalize': [True, False]\n", - " }\n", - " model_family = ModelFamily.LINEAR_MODEL\n", - " supported_problem_types = [ProblemTypes.REGRESSION]\n", - "\n", - " def __init__(self, fit_intercept=True, normalize=False, n_jobs=-1, random_state=0, **kwargs):\n", - " parameters = {\n", - " 'fit_intercept': fit_intercept,\n", - " 'normalize': normalize,\n", - " 'n_jobs': n_jobs\n", - " }\n", - " parameters.update(kwargs)\n", - " linear_regressor = SKLinearRegression(**parameters)\n", - " super().__init__(parameters=parameters,\n", - " component_obj=linear_regressor,\n", - " random_state=random_state)\n", - "\n", - " @property\n", - " def feature_importance(self):\n", - " return self._component_obj.coef_" - ] - }, { "cell_type": "markdown", "metadata": {}, @@ -471,8 +446,7 @@ "outputs": [], "source": [ "# this string can then be copy and pasted into a separate window and executed as python code\n", - "exec(code)\n", - "logisticRegressionClassifier" + "exec(code)" ] }, { @@ -481,60 +455,10 @@ "metadata": {}, "outputs": [], "source": [ - "# custom component\n", - "from evalml.pipelines.components import Transformer\n", - "import pandas as pd\n", + "# We can also do this for custom components\n", "from evalml.pipelines.components.utils import generate_component_code\n", "\n", - "class MyDropNullColumns(Transformer):\n", - " \"\"\"Transformer to drop features whose percentage of NaN values exceeds a specified threshold\"\"\"\n", - " name = \"My Drop Null Columns Transformer\"\n", - " hyperparameter_ranges = {}\n", - "\n", - " def __init__(self, pct_null_threshold=1.0, random_state=0, **kwargs):\n", - " \"\"\"Initalizes an transformer to drop features whose percentage of NaN values exceeds a specified threshold.\n", - "\n", - " Arguments:\n", - " pct_null_threshold(float): The percentage of NaN values in an input feature to drop.\n", - " Must be a value between [0, 1] inclusive. If equal to 0.0, will drop columns with any null values.\n", - " If equal to 1.0, will drop columns with all null values. 
From 0babaca8dcde3c18817d775ecdccabdf80234ebd Mon Sep 17 00:00:00 2001
From: Angela Lin
Date: Tue, 26 Jan 2021 17:32:37 -0500
Subject: [PATCH 98/98] the tiniest of docstring caps cleanup

---
 docs/source/user_guide/components.ipynb                    | 4 ++--
 .../components/estimators/regressors/baseline_regressor.py | 4 ++--
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/docs/source/user_guide/components.ipynb b/docs/source/user_guide/components.ipynb
index 59c970592b..a4e68c81a9 100644
--- a/docs/source/user_guide/components.ipynb
+++ b/docs/source/user_guide/components.ipynb
@@ -270,7 +270,7 @@
    "        \"\"\"Baseline regressor that uses a simple strategy to make predictions.\n",
    "\n",
    "        Arguments:\n",
-    "            strategy (str): method used to predict. Valid options are \"mean\", \"median\". Defaults to \"mean\".\n",
+    "            strategy (str): Method used to predict. Valid options are \"mean\", \"median\". Defaults to \"mean\".\n",
    "            random_state (int): Seed for the random number generator. Defaults to 0.\n",
    "\n",
    "        \"\"\"\n",
@@ -309,7 +309,7 @@
    "        \"\"\"Returns importance associated with each feature. Since baseline regressors do not use input features to calculate predictions, returns an array of zeroes.\n",
    "\n",
    "        Returns:\n",
-    "            np.ndarray (float): an array of zeroes\n",
+    "            np.ndarray (float): An array of zeroes\n",
    "\n",
    "        \"\"\"\n",
    "        return np.zeros(self._num_features)\n"
diff --git a/evalml/pipelines/components/estimators/regressors/baseline_regressor.py b/evalml/pipelines/components/estimators/regressors/baseline_regressor.py
index 264f5690b9..db8f7f6102 100644
--- a/evalml/pipelines/components/estimators/regressors/baseline_regressor.py
+++ b/evalml/pipelines/components/estimators/regressors/baseline_regressor.py
@@ -24,7 +24,7 @@ def __init__(self, strategy="mean", random_state=0, **kwargs):
         """Baseline regressor that uses a simple strategy to make predictions.
 
         Arguments:
-            strategy (str): method used to predict. Valid options are "mean", "median". Defaults to "mean".
+            strategy (str): Method used to predict. Valid options are "mean", "median". Defaults to "mean".
             random_state (int): Seed for the random number generator. Defaults to 0.
 
         """
@@ -63,7 +63,7 @@ def feature_importance(self):
         """Returns importance associated with each feature. Since baseline regressors do not use input features to calculate predictions, returns an array of zeroes.
 
         Returns:
-            np.ndarray (float): an array of zeroes
+            np.ndarray (float): An array of zeroes
 
         """
         return np.zeros(self._num_features)
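With this final patch applied, the end-to-end contract for the baseline components looks as follows. A minimal usage sketch, assuming an evalml build that includes this patch series (the toy data is illustrative only):

    import pandas as pd
    from evalml.pipelines.components import BaselineRegressor

    X = pd.DataFrame({"a": [1, 2, 3, 4], "b": [5, 6, 7, 8]})
    y = pd.Series([2.0, 4.0, 6.0, 8.0])

    clf = BaselineRegressor(strategy="mean")
    clf.fit(X, y)

    predictions = clf.predict(X)              # a ww.DataColumn under the new contract
    print(predictions.to_series().tolist())   # [5.0, 5.0, 5.0, 5.0] -- the mean of y
    print(clf.feature_importance)             # [0. 0.] -- baselines ignore input features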