
Commit 029c06e

VPerrollaz and ericmjl authored on May 15, 2020
[DOC] Pep8 the notebooks and markdown files in examples #415 (#655)
* Pep8 convert_currency.md
* Pep8 filter_date.md
* Pep8 make_currency_column_numeric.md
* Pep8 round_to_fraction.md
* Pep8 row_to_names.md
* Pep8 then.md
* Pep8 cells of examples/notebooks/anime.ipynb
* Pep8 examples/notebooks/bad_values.ipynb
* Pep8 the cells of examples/notebooks/bird_call.ipynb
* Pep8 cells of examples/notebooks/board_games.ipynb
* Pep8 the cells of examples/notebooks/dirty_data.ipynb
* Pep8 the cells of examples/notebooks/french_trains.ipynb
* Pep8 the cells of examples/notebooks/groupby_agg.ipynb
* Pep8 the cells of examples/notebooks/inflating_converting_currency.ipynb
* Pep8 the cells of examples/notebooks/medium_franchise.ipynb
* Pep8 the cells of examples/notebooks/normalize.ipynb
* Pep8 the cells and code in markdown of pyjanitor_intro.ipynb
* Pep8 Row_to_Names.ipynb
* Pep8 the cells of sort_naturally.ipynb
* Pep8 the cells of teacher_pupil.ipynb
* Final pep8 commit
  - Added author
  - Added change to CHANGELOG
  - Went over all notebooks with the dev version

Co-authored-by: Eric Ma <[email protected]>
1 parent 56c6f48 commit 029c06e

23 files changed: +2379 −751 lines changed
 

‎AUTHORS.rst

+2-1
@@ -87,4 +87,5 @@ Contributors
 - `@DollofCuty <https://github.com/DollofCuty>`_ | `contributions <https://github.com/ericmjl/pyjanitor/pulls?utf8=%E2%9C%93&q=is%3Aclosed+mentions%3ADollofCuty>`_
 - `@bdice <https://github.com/bdice>`_ | `contributions <https://github.com/ericmjl/pyjanitor/pulls?utf8=%E2%9C%93&q=is%3Aclosed+mentions%3Abdice>`_
 - `@evan-anderson <https://github.com/evan-anderson>`_ | `contributions <https://github.com/ericmjl/pyjanitor/pulls?utf8=%E2%9C%93&q=is%3Aclosed+mentions%3evan-anderson>`_
-`@smu095 <https://github.com/smu095>`_ | `contributions <https://github.com/ericmjl/pyjanitor/issues?q=is%3Aclosed+mentions%3smu095>`_
+- `@smu095 <https://github.com/smu095>`_ | `contributions <https://github.com/ericmjl/pyjanitor/issues?q=is%3Aclosed+mentions%3smu095>`_
+- `@VPerrollaz <https://github.com/VPerrollaz>`_ | `contributions <https://github.com/ericmjl/pyjanitor/issues?q=is%3Aclosed+mentions%3AVPerrollaz>`_

‎CHANGELOG.rst

+1
@@ -1,5 +1,6 @@
 new version (on deck)
 =====================
+- [DOC] pep8 all examples. @VPerrollaz
 - [TST]: Add docstrings to tests @hectormz
 - [INF]: Add ``debug-statements``, ``requirements-txt-fixer``, and ``interrogate`` to ``pre-commit``. @hectormz
 - [ENH]: Upgraded transform_column to use df.assign underneath the hood,

‎examples/convert_currency.md

+6-1
@@ -42,7 +42,12 @@ data_dict = {
 ```python
 example_dataframe = pd.DataFrame(data_dict)
 
-example_dataframe.convert_currency('a', from_currency='USD', to_currency='EUR', historical_date=date(2018,1,1))
+example_dataframe.convert_currency(
+    'a',
+    from_currency='USD',
+    to_currency='EUR',
+    historical_date=date(2018, 1, 1)
+)
 ```
 
 ### Output
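For readers skimming this hunk: a stdlib-only sketch of what a historical currency conversion amounts to, not pyjanitor's implementation (which queries a live exchange-rate API). The `RATES` table and the 0.83 figure are made up for illustration.

```python
from datetime import date

# Hypothetical fixed rate table standing in for the live exchange-rate
# lookup that convert_currency performs; 0.83 is an illustrative number.
RATES = {("USD", "EUR", date(2018, 1, 1)): 0.83}

def convert_currency(values, from_currency, to_currency, historical_date):
    """Multiply each amount by the looked-up historical rate."""
    rate = RATES[(from_currency, to_currency, historical_date)]
    return [round(v * rate, 2) for v in values]

converted = convert_currency([100.0, 200.0], "USD", "EUR", date(2018, 1, 1))
```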

‎examples/filter_date.md

+2-6
@@ -66,8 +66,7 @@ date_list = [
     [26, "03/11/20"],
     [27, "03/12/20"]]
 
-example_dataframe = pd.DataFrame(date_list, columns = ['AMOUNT', 'DATE'])
-
+example_dataframe = pd.DataFrame(date_list, columns=['AMOUNT', 'DATE'])
 ```
 
 ## Example 1: Filter dataframe between two dates
@@ -102,7 +101,6 @@ example_dataframe.filter_date('DATE', end=end, format=format)
 ## Example 3: Filtering by year
 
 ```python
-
 years = [2019]
 
 example_dataframe.filter_date('DATE', years=years)
@@ -125,7 +123,6 @@ example_dataframe.filter_date('DATE', years=years)
 ## Example 4: Filtering by year and month
 
 ```python
-
 years = [2020]
 months = [3]
 
@@ -144,9 +141,8 @@ example_dataframe.filter_date('DATE', years=years, months=months)
 ## Example 5: Filtering by year and day
 
 ```python
-
 years = [2020]
-days = range(10,12)
+days = range(10, 12)
 
 example_dataframe.filter_date('DATE', years=years, days=days)
 ```
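A stdlib-only sketch of the year filter these examples exercise, assuming the same `"%m/%d/%y"` date format as the markdown file; this is illustrative, not pyjanitor's implementation.

```python
from datetime import datetime

rows = [[25, "03/10/20"], [26, "03/11/20"], [27, "03/12/20"], [1, "01/01/19"]]

def filter_by_years(rows, years, fmt="%m/%d/%y"):
    # Keep only rows whose DATE field (second element) falls in the given years.
    return [r for r in rows if datetime.strptime(r[1], fmt).year in years]

kept = filter_by_years(rows, years=[2019])
```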

‎examples/make_currency_column_numeric.md

+10-3
@@ -100,8 +100,11 @@ df.make_currency_column_numeric("a", fill_all_non_numeric=35)
 ## Example 4: Coerce numeric values in column to float, replace a string value with a specific value, and replace remaining string values with a specific value
 
 ```python
-df.make_currency_column_numeric("a", cast_non_numeric=cast_non_numeric, fill_all_non_numeric=35)
-
+df.make_currency_column_numeric(
+    "a",
+    cast_non_numeric=cast_non_numeric,
+    fill_all_non_numeric=35
+)
 ```
 
 ## Output
@@ -138,7 +141,11 @@ df.make_currency_column_numeric("a", remove_non_numeric=True)
 ## Example 6: Coerce numeric values in column to float, replace a string value with a specific value, and remove remaining string values
 
 ```python
-df.make_currency_column_numeric("a", cast_non_numeric=cast_non_numeric, remove_non_numeric=True)
+df.make_currency_column_numeric(
+    "a",
+    cast_non_numeric=cast_non_numeric,
+    remove_non_numeric=True
+)
 ```
 
 ## Output
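The semantics of `cast_non_numeric` vs `fill_all_non_numeric` can be sketched in plain Python (illustrative data and function name; not pyjanitor's implementation):

```python
def make_numeric(values, cast_non_numeric=None, fill_all_non_numeric=None):
    cast_non_numeric = cast_non_numeric or {}
    out = []
    for v in values:
        try:
            out.append(float(v))  # numeric strings coerce to float
        except ValueError:
            # a string with an explicit mapping gets that value; anything
            # else falls back to the catch-all fill value
            out.append(cast_non_numeric.get(v, fill_all_non_numeric))
    return out

result = make_numeric(
    ["1.23", "foo", "bar"],
    cast_non_numeric={"foo": 42},
    fill_all_non_numeric=35,
)
```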

‎examples/notebooks/Row_to_Names.ipynb

+17-19
@@ -23,7 +23,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 1,
+"execution_count": 2,
 "metadata": {},
 "outputs": [],
 "source": [
@@ -34,7 +34,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 2,
+"execution_count": 3,
 "metadata": {},
 "outputs": [],
 "source": [
@@ -48,7 +48,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 3,
+"execution_count": 4,
 "metadata": {},
 "outputs": [
 {
@@ -121,13 +121,13 @@
 "4 bag 305 25"
 ]
 },
-"execution_count": 3,
+"execution_count": 4,
 "metadata": {},
 "output_type": "execute_result"
 }
 ],
 "source": [
-"temp = pd.read_csv(StringIO(data), header= None)\n",
+"temp = pd.read_csv(StringIO(data), header=None)\n",
 "temp"
 ]
 },
@@ -145,7 +145,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 4,
+"execution_count": 5,
 "metadata": {},
 "outputs": [
 {
@@ -211,15 +211,15 @@
 "4 bag 305 25"
 ]
 },
-"execution_count": 4,
+"execution_count": 5,
 "metadata": {},
 "output_type": "execute_result"
 }
 ],
 "source": [
-"temp.columns = temp.iloc[2,:]\n",
+"temp.columns = temp.iloc[2, :]\n",
 "temp.columns = temp.columns.str.strip()\n",
-"temp = temp.drop(2,axis=0)\n",
+"temp = temp.drop(2, axis=0)\n",
 "temp = temp.rename_axis(None, axis='columns')\n",
 "temp"
 ]
@@ -233,7 +233,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 5,
+"execution_count": 6,
 "metadata": {},
 "outputs": [
 {
@@ -299,28 +299,26 @@
 "4 bag 305 25"
 ]
 },
-"execution_count": 5,
+"execution_count": 6,
 "metadata": {},
 "output_type": "execute_result"
 }
 ],
 "source": [
-"df = (pd\n",
-" .read_csv(StringIO(data),\n",
-" header= None)\n",
-" .row_to_names(row_number=2,\n",
-" remove_row=True)\n",
-" )\n",
+"df = (\n",
+" pd.read_csv(StringIO(data), header=None)\n",
+" .row_to_names(row_number=2, remove_row=True)\n",
+")\n",
 "\n",
 "df"
 ]
 }
 ],
 "metadata": {
 "kernelspec": {
-"display_name": "PyJanitor development",
+"display_name": "Python 3",
 "language": "python",
-"name": "pyjanitor-dev"
+"name": "python3"
 },
 "language_info": {
 "codemirror_mode": {
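What `row_to_names(row_number=2, remove_row=True)` does can be sketched with the stdlib `csv` module (illustrative data; not pyjanitor's implementation, which works on a DataFrame):

```python
import csv
import io

# Two junk rows, then the real header on row 2, mirroring the notebook.
raw = "x,y,z\nx,y,z\n item, MRP ,number_sold\nshoe,220,100\nbag,305,25\n"
rows = list(csv.reader(io.StringIO(raw)))

row_number = 2
header = [c.strip() for c in rows[row_number]]    # promote row 2 to column names
body = rows[:row_number] + rows[row_number + 1:]  # remove_row=True drops that row only
```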

‎examples/notebooks/anime.ipynb

+49-48
Large diffs are not rendered by default.

‎examples/notebooks/bad_values.ipynb

+28-29
@@ -15,7 +15,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 1,
+"execution_count": 2,
 "metadata": {},
 "outputs": [],
 "source": [
@@ -33,7 +33,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 2,
+"execution_count": 4,
 "metadata": {},
 "outputs": [
 {
@@ -231,13 +231,15 @@
 "[5 rows x 24 columns]"
 ]
 },
-"execution_count": 2,
+"execution_count": 4,
 "metadata": {},
 "output_type": "execute_result"
 }
 ],
 "source": [
-"wind = pd.read_csv(\"https://raw.githubusercontent.com/rfordatascience/tidytuesday/master/data/2018/2018-11-06/us_wind.csv\")\n",
+"wind = pd.read_csv(\n",
+" \"https://raw.githubusercontent.com/rfordatascience/tidytuesday/master/data/2018/2018-11-06/us_wind.csv\"\n",
+")\n",
 "wind.head()"
 ]
 },
@@ -250,7 +252,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 3,
+"execution_count": 5,
 "metadata": {},
 "outputs": [
 {
@@ -259,7 +261,7 @@
 "-1069.986537767466"
 ]
 },
-"execution_count": 3,
+"execution_count": 5,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -278,7 +280,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 4,
+"execution_count": 6,
 "metadata": {
 "scrolled": true
 },
@@ -289,7 +291,7 @@
 "['usgs_pr_id', 'p_year', 'p_cap', 't_cap', 't_hh', 't_rd', 't_rsa', 't_ttlh']"
 ]
 },
-"execution_count": 4,
+"execution_count": 6,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -315,7 +317,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 5,
+"execution_count": 7,
 "metadata": {},
 "outputs": [
 {
@@ -513,7 +515,7 @@
 "[5 rows x 24 columns]"
 ]
 },
-"execution_count": 5,
+"execution_count": 7,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -523,8 +525,8 @@
 "wind2 = (\n",
 " wind\n",
 " .find_replace(\n",
-" usgs_pr_id=mapping, \n",
-" p_tnum=mapping, \n",
+" usgs_pr_id=mapping,\n",
+" p_tnum=mapping,\n",
 " p_cap=mapping,\n",
 " t_cap=mapping,\n",
 " t_hh=mapping,\n",
@@ -545,7 +547,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 6,
+"execution_count": 8,
 "metadata": {},
 "outputs": [
 {
@@ -554,7 +556,7 @@
 "77.31203064391"
 ]
 },
-"execution_count": 6,
+"execution_count": 8,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -596,21 +598,18 @@
 },
 {
 "cell_type": "code",
-"execution_count": 7,
+"execution_count": 9,
 "metadata": {},
 "outputs": [],
 "source": [
 "# Note that update_where mutates the original dataframe\n",
-"(wind\n",
-" .update_where(\n",
-" (wind['p_year'] < 1887) | (wind['p_year'] > 2018),\n",
-" 'p_year', np.nan)\n",
-" .update_where(\n",
-" (wind['t_hh'] <= 0) | (wind['t_hh'] >= 1000),\n",
-" 't_hh', np.nan)\n",
-" .update_where(\n",
-" (wind['xlong'] < -161.76) | (wind['xlong'] > -68.01),\n",
-" 'xlong', np.nan));"
+"(\n",
+" wind.update_where(\n",
+" (wind['p_year'] < 1887) | (wind['p_year'] > 2018), 'p_year', np.nan\n",
+" )\n",
+" .update_where((wind['t_hh'] <= 0) | (wind['t_hh'] >= 1000), 't_hh', np.nan)\n",
+" .update_where((wind['xlong'] < -161.76) | (wind['xlong'] > -68.01), 'xlong', np.nan)\n",
+");"
 ]
 },
 {
@@ -622,7 +621,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 8,
+"execution_count": 10,
 "metadata": {},
 "outputs": [
 {
@@ -631,7 +630,7 @@
 "77.31203064391"
 ]
 },
-"execution_count": 8,
+"execution_count": 10,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -643,9 +642,9 @@
 ],
 "metadata": {
 "kernelspec": {
-"display_name": "pyjanitor-dev",
+"display_name": "Python 3",
 "language": "python",
-"name": "pyjanitor-dev"
+"name": "python3"
 },
 "language_info": {
 "codemirror_mode": {
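The `update_where` chain in this notebook nulls out-of-range sensor values in place. A stdlib-only sketch of that pattern over records (illustrative data; not pyjanitor's DataFrame implementation):

```python
def update_where(records, condition, column, new_value):
    """Set `column` to `new_value` on every record matching `condition` (mutates in place)."""
    for rec in records:
        if condition(rec):
            rec[column] = new_value
    return records

# Years outside 1887-2018 are treated as bad values, as in the notebook.
turbines = [{"p_year": 1850}, {"p_year": 1995}, {"p_year": 2030}]
update_where(
    turbines,
    lambda r: r["p_year"] < 1887 or r["p_year"] > 2018,
    "p_year",
    None,
)
```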

‎examples/notebooks/bird_call.ipynb

+47-34
@@ -34,7 +34,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 1,
+"execution_count": 2,
 "metadata": {},
 "outputs": [],
 "source": [
@@ -53,13 +53,20 @@
 },
 {
 "cell_type": "code",
-"execution_count": 2,
+"execution_count": 4,
 "metadata": {},
 "outputs": [],
 "source": [
-"raw_birds = pd.read_csv(\"https://raw.githubusercontent.com/rfordatascience/tidytuesday/master/data/2019/2019-04-30/raw/Chicago_collision_data.csv\")\n",
-"raw_call = pd.read_csv(\"https://raw.githubusercontent.com/rfordatascience/tidytuesday/master/data/2019/2019-04-30/raw/bird_call.csv\", sep=\" \")\n",
-"raw_light = pd.read_csv(\"https://raw.githubusercontent.com/rfordatascience/tidytuesday/master/data/2019/2019-04-30/raw/Light_levels_dryad.csv\")"
+"raw_birds = pd.read_csv(\n",
+" \"https://raw.githubusercontent.com/rfordatascience/tidytuesday/master/data/2019/2019-04-30/raw/Chicago_collision_data.csv\"\n",
+")\n",
+"raw_call = pd.read_csv(\n",
+" \"https://raw.githubusercontent.com/rfordatascience/tidytuesday/master/data/2019/2019-04-30/raw/bird_call.csv\", \n",
+" sep=\" \"\n",
+")\n",
+"raw_light = pd.read_csv(\n",
+" \"https://raw.githubusercontent.com/rfordatascience/tidytuesday/master/data/2019/2019-04-30/raw/Light_levels_dryad.csv\"\n",
+")"
 ]
 },
 {
@@ -73,7 +80,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 3,
+"execution_count": 5,
 "metadata": {},
 "outputs": [
 {
@@ -152,7 +159,7 @@
 "4 Ammodramus nelsoni 1986-09-10 MP"
 ]
 },
-"execution_count": 3,
+"execution_count": 5,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -163,7 +170,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 4,
+"execution_count": 6,
 "metadata": {},
 "outputs": [
 {
@@ -260,7 +267,7 @@
 "4 Seiurus aurocapilla Parulidae 4580 Yes Forest Lower"
 ]
 },
-"execution_count": 4,
+"execution_count": 6,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -271,7 +278,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 5,
+"execution_count": 7,
 "metadata": {},
 "outputs": [
 {
@@ -338,7 +345,7 @@
 "4 2000-04-02 17"
 ]
 },
-"execution_count": 5,
+"execution_count": 7,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -363,7 +370,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 6,
+"execution_count": 8,
 "metadata": {},
 "outputs": [],
 "source": [
@@ -372,7 +379,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 7,
+"execution_count": 9,
 "metadata": {},
 "outputs": [
 {
@@ -439,7 +446,7 @@
 "4 2000-04-02 17"
 ]
 },
-"execution_count": 7,
+"execution_count": 9,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -457,20 +464,20 @@
 },
 {
 "cell_type": "code",
-"execution_count": 8,
+"execution_count": 10,
 "metadata": {},
 "outputs": [],
 "source": [
 "clean_call = (\n",
 " raw_call\n",
-" .rename_column(\"Species\", \"Genus\") # rename 'Species' column to 'Genus'\n",
-" .rename_column(\"Family\", \"Species\") # rename 'Family' columnto 'Species'\n",
+" .rename_column(\"Species\", \"Genus\")  # rename 'Species' column to 'Genus'\n",
+" .rename_column(\"Family\", \"Species\")  # rename 'Family' columnto 'Species'\n",
 ")"
 ]
 },
 {
 "cell_type": "code",
-"execution_count": 9,
+"execution_count": 11,
 "metadata": {},
 "outputs": [
 {
@@ -567,7 +574,7 @@
 "4 Seiurus aurocapilla Parulidae 4580 Yes Forest Lower"
 ]
 },
-"execution_count": 9,
+"execution_count": 11,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -585,24 +592,35 @@
 },
 {
 "cell_type": "code",
-"execution_count": 10,
+"execution_count": 12,
 "metadata": {},
 "outputs": [],
 "source": [
 "clean_birds = (\n",
 " raw_birds\n",
-" .merge(clean_call, how='left') # merge the raw_birds dataframe with clean_raw dataframe\n",
-" .select_columns([\"Genus\", \"Species\", \"Date\", \"Locality\", \"Collisions\", \"Call\", \"Habitat\", \"Stratum\"]) # include list of cols\n",
-" .clean_names() \n",
-" .rename_column(\"collisions\", \"family\") # rename 'collisions' column to 'family' in merged dataframe\n",
+" .merge(clean_call, how='left')  # merge the raw_birds dataframe with clean_raw dataframe\n",
+" .select_columns(\n",
+" [\n",
+" \"Genus\",\n",
+" \"Species\",\n",
+" \"Date\",\n",
+" \"Locality\",\n",
+" \"Collisions\",\n",
+" \"Call\",\n",
+" \"Habitat\",\n",
+" \"Stratum\"\n",
+" ]\n",
+" )  # include list of cols\n",
+" .clean_names()\n",
+" .rename_column(\"collisions\", \"family\")  # rename 'collisions' column to 'family' in merged dataframe\n",
 " .rename_column(\"call\", \"flight_call\")\n",
-" .dropna() # drop all rows which contain a NaN\n",
+" .dropna()  # drop all rows which contain a NaN\n",
 ")"
 ]
 },
 {
 "cell_type": "code",
-"execution_count": 11,
+"execution_count": 13,
 "metadata": {},
 "outputs": [
 {
@@ -712,19 +730,14 @@
 "93 Yes Open Lower\\t "
 ]
 },
-"execution_count": 11,
+"execution_count": 13,
 "metadata": {},
 "output_type": "execute_result"
 }
 ],
 "source": [
 "clean_birds.head()"
 ]
-},
-{
-"cell_type": "markdown",
-"metadata": {},
-"source": []
 }
 ],
 "metadata": {
@@ -743,9 +756,9 @@
 "name": "python",
 "nbconvert_exporter": "python",
 "pygments_lexer": "ipython3",
-"version": "3.7.3"
+"version": "3.7.6"
 }
 },
 "nbformat": 4,
-"nbformat_minor": 2
+"nbformat_minor": 4
 }
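The select/rename/dropna chain in this notebook can be sketched over plain dicts (illustrative records and helper names; pyjanitor's verbs operate on DataFrames):

```python
records = [
    {"Genus": "Seiurus", "Species": "aurocapilla", "Collisions": 4580, "Call": "Yes"},
    {"Genus": "Ammodramus", "Species": "nelsoni", "Collisions": None, "Call": "No"},
]

def select_columns(records, columns):
    # Keep only the listed keys, in order.
    return [{k: r[k] for k in columns} for r in records]

def rename_column(records, old, new):
    return [{(new if k == old else k): v for k, v in r.items()} for r in records]

def dropna(records):
    # Drop any record containing a missing value.
    return [r for r in records if all(v is not None for v in r.values())]

clean = dropna(
    rename_column(select_columns(records, ["Genus", "Collisions"]), "Collisions", "family")
)
```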

‎examples/notebooks/board_games.ipynb

+37-27
Large diffs are not rendered by default.

‎examples/notebooks/dirty_data.ipynb

+21-18
@@ -27,7 +27,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 1,
+"execution_count": 2,
 "metadata": {},
 "outputs": [],
 "source": [
@@ -44,7 +44,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 2,
+"execution_count": 4,
 "metadata": {},
 "outputs": [
 {
@@ -315,7 +315,7 @@
 "12 NaN "
 ]
 },
-"execution_count": 2,
+"execution_count": 4,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -336,7 +336,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 3,
+"execution_count": 5,
 "metadata": {},
 "outputs": [
 {
@@ -416,7 +416,7 @@
 "1 Yes NaN Physical ed Theater NaN "
 ]
 },
-"execution_count": 3,
+"execution_count": 5,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -442,7 +442,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 4,
+"execution_count": 6,
 "metadata": {},
 "outputs": [
 {
@@ -544,7 +544,7 @@
 "8 No PENDING NaN "
 ]
 },
-"execution_count": 4,
+"execution_count": 6,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -572,7 +572,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 5,
+"execution_count": 7,
 "metadata": {},
 "outputs": [
 {
@@ -688,7 +688,7 @@
 "4 1.00 Yes PENDING NaN "
 ]
 },
-"execution_count": 5,
+"execution_count": 7,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -723,7 +723,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 6,
+"execution_count": 8,
 "metadata": {},
 "outputs": [
 {
@@ -832,7 +832,7 @@
 "11 Vocal music English"
 ]
 },
-"execution_count": 6,
+"execution_count": 8,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -850,7 +850,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 7,
+"execution_count": 9,
 "metadata": {},
 "outputs": [
 {
@@ -1051,7 +1051,7 @@
 "11 0.80 No Vocal music "
 ]
 },
-"execution_count": 7,
+"execution_count": 9,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -1063,7 +1063,10 @@
 " .remove_empty()\n",
 " .rename_column(\"%_allocated\", \"percent_allocated\")\n",
 " .rename_column(\"full_time_\", \"full_time\")\n",
-" .coalesce(column_names=['certification', 'certification_1'], new_column_name='certification')\n",
+" .coalesce(\n",
+" column_names=['certification', 'certification_1'],\n",
+" new_column_name='certification'\n",
+" )\n",
 ")\n",
 "\n",
 "df_clean"
@@ -1088,7 +1091,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 8,
+"execution_count": 10,
 "metadata": {},
 "outputs": [
 {
@@ -1289,7 +1292,7 @@
 "11 0.80 No Vocal music "
 ]
 },
-"execution_count": 8,
+"execution_count": 10,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -1331,9 +1334,9 @@
 "name": "python",
 "nbconvert_exporter": "python",
 "pygments_lexer": "ipython3",
-"version": "3.7.3"
+"version": "3.7.6"
 }
 },
 "nbformat": 4,
-"nbformat_minor": 2
+"nbformat_minor": 4
 }
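The `coalesce` call reformatted in this hunk merges two sparse columns into one by taking the first non-missing value per row. A stdlib-only sketch of that behavior (illustrative data; not pyjanitor's implementation):

```python
def coalesce(*columns):
    """First non-None value per row across parallel columns."""
    return [next((v for v in row if v is not None), None) for row in zip(*columns)]

certification = ["Physics", None, None]
certification_1 = [None, "Theater", None]
merged = coalesce(certification, certification_1)
```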

‎examples/notebooks/french_trains.ipynb

+60-42
Large diffs are not rendered by default.

‎examples/notebooks/groupby_agg.ipynb

+19-15
@@ -32,18 +32,18 @@
 },
 {
 "cell_type": "code",
-"execution_count": 1,
+"execution_count": 2,
 "metadata": {},
 "outputs": [],
 "source": [
-"#load modules\n",
+"# load modules\n",
 "import pandas as pd\n",
 "from janitor import groupby_agg"
 ]
 },
 {
 "cell_type": "code",
-"execution_count": 2,
+"execution_count": 3,
 "metadata": {},
 "outputs": [
 {
@@ -116,15 +116,17 @@
 "4 bag 305 25"
 ]
 },
-"execution_count": 2,
+"execution_count": 3,
 "metadata": {},
 "output_type": "execute_result"
 }
 ],
 "source": [
-"data = {'item':['shoe','shoe','bag','shoe','bag'],\n",
-" 'MRP':[220,450,320,200,305],\n",
-" 'number_sold':[100,40,56,38,25]}\n",
+"data = {\n",
+" 'item': ['shoe', 'shoe', 'bag', 'shoe', 'bag'],\n",
+" 'MRP': [220, 450, 320, 200, 305],\n",
+" 'number_sold': [100, 40, 56, 38, 25]\n",
+"}\n",
 "\n",
 "df = pd.DataFrame(data)\n",
 "\n",
@@ -140,7 +142,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 3,
+"execution_count": 4,
 "metadata": {},
 "outputs": [
 {
@@ -219,26 +221,28 @@
 "4 bag 305 25 312.5"
 ]
 },
-"execution_count": 3,
+"execution_count": 4,
 "metadata": {},
 "output_type": "execute_result"
 }
 ],
 "source": [
-"df = df.groupby_agg(by='item',\n",
-" agg='mean',\n",
-" agg_column_name='MRP',\n",
-" new_column_name='Avg_MRP')\n",
+"df = df.groupby_agg(\n",
+" by='item',\n",
+" agg='mean',\n",
+" agg_column_name='MRP',\n",
+" new_column_name='Avg_MRP'\n",
+")\n",
 "\n",
 "df"
 ]
 }
 ],
 "metadata": {
 "kernelspec": {
-"display_name": "PyJanitor development",
+"display_name": "Python 3",
 "language": "python",
-"name": "pyjanitor-dev"
+"name": "python3"
 },
 "language_info": {
 "codemirror_mode": {
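`groupby_agg` computes a group-wise aggregate and broadcasts it back as a new column the same length as the frame. A stdlib-only sketch using the notebook's data (not pyjanitor's implementation):

```python
from collections import defaultdict

items = ["shoe", "shoe", "bag", "shoe", "bag"]
mrp = [220, 450, 320, 200, 305]

# Group-wise mean of MRP per item.
totals, counts = defaultdict(float), defaultdict(int)
for key, value in zip(items, mrp):
    totals[key] += value
    counts[key] += 1
means = {k: totals[k] / counts[k] for k in totals}

# Broadcast back to row length, like groupby_agg's Avg_MRP column.
avg_mrp = [means[k] for k in items]
```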

‎examples/notebooks/inflating_converting_currency.ipynb

+50-41
Large diffs are not rendered by default.

‎examples/notebooks/medium_franchise.ipynb

+224-234
Large diffs are not rendered by default.

‎examples/notebooks/normalize.ipynb

+1,575-60
Large diffs are not rendered by default.

‎examples/notebooks/pyjanitor_intro.ipynb

+99-98
Large diffs are not rendered by default.

‎examples/notebooks/sort_naturally.ipynb

+11-18
@@ -9,13 +9,13 @@
 },
 {
 "cell_type": "code",
-"execution_count": 1,
+"execution_count": 2,
 "metadata": {},
 "outputs": [],
 "source": [
 "import pandas_flavor as pf\n",
 "import pandas as pd\n",
-"import janitor\n"
+"import janitor"
 ]
 },
 {
@@ -27,7 +27,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 7,
+"execution_count": 3,
 "metadata": {},
 "outputs": [
 {
@@ -100,15 +100,15 @@
 "5 B12 7"
 ]
 },
-"execution_count": 7,
+"execution_count": 3,
 "metadata": {},
 "output_type": "execute_result"
 }
 ],
 "source": [
 "data = {\n",
 " \"Well\": [\"A21\", \"A3\", \"A21\", \"B2\", \"B51\", \"B12\"],\n",
-" \"Value\":[ 1, 2, 13, 3, 4, 7],\n",
+" \"Value\": [1, 2, 13, 3, 4, 7],\n",
 "}\n",
 "df = pd.DataFrame(data)\n",
 "df"
@@ -127,7 +127,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 8,
+"execution_count": 4,
 "metadata": {},
 "outputs": [
 {
@@ -200,7 +200,7 @@
 "4 B51 4"
 ]
 },
-"execution_count": 8,
+"execution_count": 4,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -218,7 +218,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": 9,
+"execution_count": 5,
 "metadata": {},
 "outputs": [
 {
@@ -291,7 +291,7 @@
 "4 B51 4"
 ]
 },
-"execution_count": 9,
+"execution_count": 5,
 "metadata": {},
 "output_type": "execute_result"
 }
@@ -306,20 +306,13 @@
 "source": [
 "Now we're in sorting bliss! :)"
 ]
-},
-{
-"cell_type": "code",
-"execution_count": null,
-"metadata": {},
-"outputs": [],
-"source": []
 }
 ],
 "metadata": {
 "kernelspec": {
-"display_name": "pyjanitor-dev",
+"display_name": "Python 3",
 "language": "python",
-"name": "pyjanitor-dev"
+"name": "python3"
 },
 "language_info": {
 "codemirror_mode": {
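The "natural" ordering this notebook demonstrates (A3 before A21, B2 before B12) can be sketched with a stdlib sort key; this is a common natural-sort idiom, not pyjanitor's implementation:

```python
import re

def natural_key(s):
    # Split "B12" into ["B", 12, ""] so numeric runs compare as integers,
    # not character by character.
    return [int(part) if part.isdigit() else part for part in re.split(r"(\d+)", s)]

wells = ["A21", "A3", "A21", "B2", "B51", "B12"]
ordered = sorted(wells, key=natural_key)
```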

‎examples/notebooks/teacher_pupil.ipynb

+28-18
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@
2323
},
2424
{
2525
"cell_type": "code",
26-
"execution_count": 1,
26+
"execution_count": 2,
2727
"metadata": {
2828
"pycharm": {
2929
"is_executing": false,
@@ -145,7 +145,7 @@
145145
"4 Democratic Republic of the Congo 2012 2012 34.74758 NaN NaN "
146146
]
147147
},
148-
"execution_count": 1,
148+
"execution_count": 2,
149149
"metadata": {},
150150
"output_type": "execute_result"
151151
}
@@ -155,8 +155,10 @@
155155
"import pandas as pd\n",
156156
"import pandas_flavor as pf\n",
157157
"\n",
158-
"dirty_csv = \"https://raw.githubusercontent.com/rfordatascience/tidytuesday/master/data/2019/2019-05-07/EDULIT_DS_06052019101747206.csv\"\n",
159-
"dirty_df= pd.read_csv(dirty_csv)\n",
158+
"dirty_csv = (\n",
159+
" \"https://raw.githubusercontent.com/rfordatascience/tidytuesday/master/data/2019/2019-05-07/EDULIT_DS_06052019101747206.csv\"\n",
160+
")\n",
161+
"dirty_df = pd.read_csv(dirty_csv)\n",
160162
"dirty_df.head()\n"
161163
]
162164
},
@@ -186,7 +188,7 @@
186188
},
187189
{
188190
"cell_type": "code",
189-
"execution_count": 2,
191+
"execution_count": 3,
190192
"metadata": {},
191193
"outputs": [
192194
{
@@ -201,7 +203,7 @@
201203
" 'Pupil-teacher ratio in upper secondary education (headcount basis)'}"
202204
]
203205
},
204-
"execution_count": 2,
206+
"execution_count": 3,
205207
"metadata": {},
206208
"output_type": "execute_result"
207209
}
@@ -229,7 +231,7 @@
229231
},
230232
{
231233
"cell_type": "code",
232-
"execution_count": 3,
234+
"execution_count": 4,
233235
"metadata": {
234236
"pycharm": {
235237
"is_executing": false,
@@ -264,14 +266,20 @@
264266
"def drop_duplicated_column(df, column_name: str, column_order: int=0):\n",
265267
" \"\"\"Remove duplicated columns and retain only a column given its order.\n",
266268
" Order 0 is to remove the first column, Order 1 is to remove the second column, and etc\"\"\"\n",
267-
" \n",
269+
"\n",
268270
" cols = list(df.columns)\n",
269-
" col_indexes = [col_idx for col_idx, col_name in enumerate(cols) if col_name == column_name]\n",
270-
" \n",
271+
" col_indexes = [\n",
272+
" col_idx for col_idx,\n",
273+
" col_name in enumerate(cols) if col_name == column_name\n",
274+
" ]\n",
275+
"\n",
271276
" # given that a column could be duplicated, user could opt based on its order\n",
272277
" removed_col_idx = col_indexes[column_order]\n",
273278
" # get the column indexes without column that is being removed\n",
274-
" filtered_cols = [c_i for c_i, c_v in enumerate(cols) if c_i != removed_col_idx]\n",
279+
" filtered_cols = [\n",
280+
" c_i for c_i,\n",
281+
" c_v in enumerate(cols) if c_i != removed_col_idx\n",
282+
" ]\n",
275283
" return df.iloc[:, filtered_cols]\n",
276284
"\n"
277285
]
@@ -285,7 +293,7 @@
285293
},
286294
{
287295
"cell_type": "code",
288-
"execution_count": 4,
296+
"execution_count": 5,
289297
"metadata": {},
290298
"outputs": [
291299
{
@@ -395,7 +403,7 @@
395403
"4 Democratic Republic of the Congo 2012 34.74758 NaN NaN "
396404
]
397405
},
398-
"execution_count": 4,
406+
"execution_count": 5,
399407
"metadata": {},
400408
"output_type": "execute_result"
401409
}
@@ -412,7 +420,7 @@
412420
" .str_trim(\"country\")\n",
413421
" .str_title(\"indicator\")\n",
414422
" # remove `time` column (which is duplicated). The second `time` is being removed\n",
415-
" .drop_duplicated_column(\"time\", 1) \n",
423+
" .drop_duplicated_column(\"time\", 1)\n",
416424
" # renaming columns\n",
417425
" .rename_column(\"location\", \"country_code\")\n",
418426
" .rename_column(\"value\", \"student_ratio\")\n",
@@ -424,7 +432,7 @@
424432
},
425433
{
426434
"cell_type": "code",
427-
"execution_count": 5,
435+
"execution_count": 6,
428436
"metadata": {
429437
"pycharm": {
430438
"is_executing": false,
@@ -435,7 +443,9 @@
435443
"outputs": [],
436444
"source": [
437445
"# ensure that the output from janitor is similar with the clean r's janitor\n",
438-
"r_clean_csv = \"https://raw.githubusercontent.com/rfordatascience/tidytuesday/master/data/2019/2019-05-07/student_teacher_ratio.csv\"\n",
446+
"r_clean_csv = (\n",
447+
" \"https://raw.githubusercontent.com/rfordatascience/tidytuesday/master/data/2019/2019-05-07/student_teacher_ratio.csv\"\n",
448+
")\n",
439449
"r_clean_df = pd.read_csv(r_clean_csv)\n",
440450
"\n",
441451
"pd.testing.assert_frame_equal(r_clean_df, py_clean_df)"
@@ -458,7 +468,7 @@
458468
"name": "python",
459469
"nbconvert_exporter": "python",
460470
"pygments_lexer": "ipython3",
461-
"version": "3.7.3"
471+
"version": "3.7.6"
462472
},
463473
"stem_cell": {
464474
"cell_type": "raw",
@@ -471,5 +481,5 @@
471481
}
472482
},
473483
"nbformat": 4,
474-
"nbformat_minor": 2
484+
"nbformat_minor": 4
475485
}
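The helper reflowed at the top of this diff drops one occurrence of a duplicated column by filtering positional indexes. As a standalone sketch of that technique (pyjanitor ships its own `drop_duplicated_column`; the function below is a hypothetical reimplementation for illustration, with made-up data):

```python
import pandas as pd


def drop_duplicated_column(df, column_name, nth_index=0):
    """Drop the nth occurrence of a duplicated column name (sketch)."""
    # positional indexes of every column whose name matches
    col_indexes = [i for i, c in enumerate(df.columns) if c == column_name]
    removed_col_idx = col_indexes[nth_index]
    # keep every positional index except the one being removed
    filtered_cols = [i for i in range(len(df.columns)) if i != removed_col_idx]
    return df.iloc[:, filtered_cols]


df = pd.DataFrame([[1, 2, 3]], columns=["time", "value", "time"])
cleaned = drop_duplicated_column(df, "time", 1)  # drop the second `time`
```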

‎examples/notebooks/transform_column.ipynb

+88 -31
@@ -2,7 +2,7 @@
 "cells": [
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 1,
 "metadata": {},
 "outputs": [],
 "source": [
@@ -32,7 +32,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 3,
 "metadata": {},
 "outputs": [],
 "source": [
@@ -50,7 +50,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 4,
 "metadata": {},
 "outputs": [],
 "source": [
@@ -59,7 +59,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 5,
 "metadata": {},
 "outputs": [],
 "source": [
@@ -75,9 +75,17 @@
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 6,
 "metadata": {},
-"outputs": [],
+"outputs": [
+{
+"name": "stdout",
+"output_type": "stream",
+"text": [
+"1.86 s ± 102 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n"
+]
+}
+],
 "source": [
 "%%timeit\n",
 "# We are using a lambda function that operates on each element,\n",
@@ -94,9 +102,17 @@
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 7,
 "metadata": {},
-"outputs": [],
+"outputs": [
+{
+"name": "stdout",
+"output_type": "stream",
+"text": [
+"15.7 ms ± 1.01 ms per loop (mean ± std. dev. of 7 runs, 100 loops each)\n"
+]
+}
+],
 "source": [
 "%%timeit\n",
 "df.transform_column(\"0\", lambda s: np.abs(s), elementwise=False)"
@@ -126,7 +142,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 8,
 "metadata": {},
 "outputs": [],
 "source": [
@@ -149,7 +165,7 @@
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 9,
 "metadata": {},
 "outputs": [],
 "source": [
@@ -159,39 +175,71 @@
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 10,
 "metadata": {},
-"outputs": [],
+"outputs": [
+{
+"name": "stdout",
+"output_type": "stream",
+"text": [
+"408 ms ± 13.3 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n"
+]
+}
+],
 "source": [
 "%%timeit\n",
 "stringdf.assign(data=first_five(stringdf[\"data\"]))"
 ]
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 11,
 "metadata": {},
-"outputs": [],
+"outputs": [
+{
+"name": "stdout",
+"output_type": "stream",
+"text": [
+"293 ms ± 4.29 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n"
+]
+}
+],
 "source": [
 "%%timeit\n",
 "first_five(stringdf[\"data\"])"
 ]
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 12,
 "metadata": {},
-"outputs": [],
+"outputs": [
+{
+"name": "stdout",
+"output_type": "stream",
+"text": [
+"295 ms ± 10 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n"
+]
+}
+],
 "source": [
 "%%timeit\n",
 "stringdf[\"data\"].str[0:5]"
 ]
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 13,
 "metadata": {},
-"outputs": [],
+"outputs": [
+{
+"name": "stdout",
+"output_type": "stream",
+"text": [
+"301 ms ± 7.18 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n"
+]
+}
+],
 "source": [
 "%%timeit\n",
 "stringdf[\"data\"].apply(lambda x: x[0:5])"
@@ -208,9 +256,17 @@
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 14,
 "metadata": {},
-"outputs": [],
+"outputs": [
+{
+"name": "stdout",
+"output_type": "stream",
+"text": [
+"409 ms ± 10.1 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n"
+]
+}
+],
 "source": [
 "%%timeit\n",
 "stringdf.transform_column(\"data\", lambda x: x[0:5])"
@@ -225,27 +281,28 @@
 },
 {
 "cell_type": "code",
-"execution_count": null,
+"execution_count": 15,
 "metadata": {},
-"outputs": [],
+"outputs": [
+{
+"name": "stdout",
+"output_type": "stream",
+"text": [
+"403 ms ± 7.55 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)\n"
+]
+}
+],
 "source": [
 "%%timeit\n",
 "stringdf.transform_column(\"data\", first_five, elementwise=False)"
 ]
-},
-{
-"cell_type": "code",
-"execution_count": null,
-"metadata": {},
-"outputs": [],
-"source": []
 }
 ],
 "metadata": {
 "kernelspec": {
-"display_name": "pyjanitor-dev",
+"display_name": "Python 3",
 "language": "python",
-"name": "pyjanitor-dev"
+"name": "python3"
 },
 "language_info": {
 "codemirror_mode": {

‎examples/round_to_fraction.md

-2
@@ -50,7 +50,6 @@ example_dataframe.round_to_fraction('a', 2)
 ## Example 2: Rounding the first column to nearest third
 
 ```python
-
 example_dataframe2 = pd.DataFrame(data_dict)
 
 example_dataframe2.limit_column_characters('a', 3)
@@ -72,7 +71,6 @@ example_dataframe2.limit_column_characters('a', 3)
 ## Example 3: Rounding the first column to the nearest third and rounding each value to the 10,000th place
 
 ```python
-
 example_dataframe2 = pd.DataFrame(data_dict)
 
 example_dataframe2.limit_column_characters('a', 3, 4)
‎examples/row_to_names.md

-3
@@ -25,7 +25,6 @@ Remove the rows from the index above `row_number`.
 ## Setup
 
 ```python
-
 import pandas as pd
 import janitor
 
@@ -63,7 +62,6 @@ example_dataframe.row_to_names(0)
 ## Example2: Move first row to column names and remove row
 
 ```python
-
 example_dataframe = pd.DataFrame(data_dict)
 
 example_dataframe.row_to_names(0, remove_row=True)
@@ -84,7 +82,6 @@ example_dataframe.row_to_names(0, remove_row=True)
 ## Example3: Move first row to column names, remove row, and remove rows above selected row
 
 ```python
-
 example_dataframe = pd.DataFrame(data_dict)
 
 example_dataframe.row_to_names(2, remove_row=True, remove_rows_above=True)
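The `row_to_names` calls in this file promote a data row to the column header. The same shuffle in plain pandas, as a sketch with made-up data mirroring `row_to_names(2, remove_row=True, remove_rows_above=True)`:

```python
import pandas as pd

df = pd.DataFrame({"a": ["x", "y", "col1", 1], "b": ["u", "v", "col2", 2]})

row_number = 2
df.columns = df.iloc[row_number]  # promote row 2 to the header
df = df.iloc[row_number + 1:]     # remove_row + remove_rows_above drop
                                  # the promoted row and everything above it
```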

‎examples/then.md

+5 -3
@@ -80,9 +80,11 @@ example_dataframe2.then(remove_rows_3_and_4)
 
 ```python
 example_dataframe = pd.DataFrame(data_dict)
-example_dataframe = (example_dataframe
- .then(remove_first_two_letters_from_col_names)
- .then(remove_rows_3_and_4))
+example_dataframe = (
+ example_dataframe
+ .then(remove_first_two_letters_from_col_names)
+ .then(remove_rows_3_and_4)
+)
 ```
 
 ### Output

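The chain reflowed above uses pyjanitor's `then(fn)`, which simply calls `fn(df)` at that point in the chain. pandas' built-in `DataFrame.pipe` does the same thing; here is a self-contained sketch with made-up helper functions:

```python
import pandas as pd


def drop_first_row(df):
    return df.iloc[1:]


def double_values(df):
    return df * 2


df = pd.DataFrame({"a": [1, 2, 3]})

# Each .pipe(fn) passes the current DataFrame to fn and chains the result,
# exactly the pattern the reflowed .then() chain expresses.
result = (
    df
    .pipe(drop_first_row)
    .pipe(double_values)
)
```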