In [21]:
# Import the modules
import numpy as np
import pandas as pd
from pathlib import Path
from sklearn.metrics import confusion_matrix, classification_report

---

## Split the Data into Training and Testing Sets

### Step 1: Read the `lending_data.csv` data from the `Resources` folder into a Pandas DataFrame.

In [22]:
# Read the CSV file from the Resources folder into a Pandas DataFrame
mushroom_data_df = pd.read_csv('agaricus-lepiota.data')

# Review the DataFrame
mushroom_data_df

Unnamed: 0,classes,capshape,capsurface,capcolor,bruises,odor,gillattachment,gillspacing,gillsize,gillcolor,...,stalk-surface-below-ring,stalk-color-above-ring,stalk-color-below-ring,veil-type,veil-color,ring-number,ring-type,spore-print-color,population,habitat
0,p,x,s,n,t,p,f,c,n,k,...,s,w,w,p,w,o,p,k,s,u
1,e,x,s,y,t,a,f,c,b,k,...,s,w,w,p,w,o,p,n,n,g
2,e,b,s,w,t,l,f,c,b,n,...,s,w,w,p,w,o,p,n,n,m
3,p,x,y,w,t,p,f,c,n,n,...,s,w,w,p,w,o,p,k,s,u
4,e,x,s,g,f,n,f,w,b,k,...,s,w,w,p,w,o,e,n,a,g
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
8119,e,k,s,n,f,n,a,c,b,y,...,s,o,o,p,o,o,p,b,c,l
8120,e,x,s,n,f,n,a,c,b,y,...,s,o,o,p,n,o,p,b,v,l
8121,e,f,s,n,f,n,a,c,b,n,...,s,o,o,p,o,o,p,b,c,l
8122,p,k,y,n,f,y,f,c,n,b,...,k,w,w,p,w,o,e,w,v,l


In [23]:
# Rename all letters in table
# Classes:
mushroom_data_df['classes'] = mushroom_data_df['classes'].replace({'e': 'edible'})
mushroom_data_df['classes'] = mushroom_data_df['classes'].replace({'p': 'poisonous'})

mushroom_data_df

Unnamed: 0,classes,capshape,capsurface,capcolor,bruises,odor,gillattachment,gillspacing,gillsize,gillcolor,...,stalk-surface-below-ring,stalk-color-above-ring,stalk-color-below-ring,veil-type,veil-color,ring-number,ring-type,spore-print-color,population,habitat
0,poisonous,x,s,n,t,p,f,c,n,k,...,s,w,w,p,w,o,p,k,s,u
1,edible,x,s,y,t,a,f,c,b,k,...,s,w,w,p,w,o,p,n,n,g
2,edible,b,s,w,t,l,f,c,b,n,...,s,w,w,p,w,o,p,n,n,m
3,poisonous,x,y,w,t,p,f,c,n,n,...,s,w,w,p,w,o,p,k,s,u
4,edible,x,s,g,f,n,f,w,b,k,...,s,w,w,p,w,o,e,n,a,g
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
8119,edible,k,s,n,f,n,a,c,b,y,...,s,o,o,p,o,o,p,b,c,l
8120,edible,x,s,n,f,n,a,c,b,y,...,s,o,o,p,n,o,p,b,v,l
8121,edible,f,s,n,f,n,a,c,b,n,...,s,o,o,p,o,o,p,b,c,l
8122,poisonous,k,y,n,f,y,f,c,n,b,...,k,w,w,p,w,o,e,w,v,l


In [26]:
mushroom_data_df.loc['classes']

KeyError: 'classes'

In [24]:
# Cap-shape
mushroom_data_df['capshape'] = mushroom_data_df['capshape'].replace({'x: convex'})



KeyError: 'capshape'

In [None]:
# Cap-surface
mushroom_data_df['cap-surface'] = mushroom_data_df['cap-surface'].replace({'f': 'fibrous'})
mushroom_data_df['cap-surface'] = mushroom_data_df['cap-surface'].replace({'g': 'grooves'})
mushroom_data_df['cap-surface'] = mushroom_data_df['cap-surface'].replace({'y': 'scaly'})
mushroom_data_df['cap-surface'] = mushroom_data_df['cap-surface'].replace({'s': 'smooth'})

# Cap-color
mushroom_data_df['cap-color'] = mushroom_data_df['cap-color'].replace({'n': 'brown'})
mushroom_data_df['cap-color'] = mushroom_data_df['cap-color'].replace({'b': 'buff'})
mushroom_data_df['cap-color'] = mushroom_data_df['cap-color'].replace({'c': 'cinnamon'})
mushroom_data_df['cap-color'] = mushroom_data_df['cap-color'].replace({'g': 'gray'})
mushroom_data_df['cap-color'] = mushroom_data_df['cap-color'].replace({'r': 'green'})
mushroom_data_df['cap-color'] = mushroom_data_df['cap-color'].replace({'p': 'pink'})
mushroom_data_df['cap-color'] = mushroom_data_df['cap-color'].replace({'u': 'purple'})
mushroom_data_df['cap-color'] = mushroom_data_df['cap-color'].replace({'e': 'red'})
mushroom_data_df['cap-color'] = mushroom_data_df['cap-color'].replace({'w': 'white'})
mushroom_data_df['cap-color'] = mushroom_data_df['cap-color'].replace({'y': 'yellow'})
# Bruises?
mushroom_data_df['bruises?'] = mushroom_data_df['bruises?'].replace({'t': 'bruises'})
mushroom_data_df['bruises?'] = mushroom_data_df['bruises?'].replace({'f': 'no'})

# Odor:
mushroom_data_df['odor'] = mushroom_data_df['odor'].replace({'a': 'almond'})
mushroom_data_df['odor'] = mushroom_data_df['odor'].replace({'l': 'anise'})
mushroom_data_df['odor'] = mushroom_data_df['odor'].replace({'c': 'creosote'})
mushroom_data_df['odor'] = mushroom_data_df['odor'].replace({'y': 'fishy'})
mushroom_data_df['odor'] = mushroom_data_df['odor'].replace({'f': 'foul'})
mushroom_data_df['odor'] = mushroom_data_df['odor'].replace({'m': 'musty'})
mushroom_data_df['odor'] = mushroom_data_df['odor'].replace({'n': 'none'})
mushroom_data_df['odor'] = mushroom_data_df['odor'].replace({'p': 'pungent'})
mushroom_data_df['odor'] = mushroom_data_df['odor'].replace({'s': 'spicy'})

# Gill-attachment
mushroom_data_df['gill-attachment'] = mushroom_data_df['gill-attachment'].replace({'a': 'attached'})
mushroom_data_df['gill-attachment'] = mushroom_data_df['gill-attachment'].replace({'d': 'descending'})
mushroom_data_df['gill-attachment'] = mushroom_data_df['gill-attachment'].replace({'f': 'free'})
mushroom_data_df['gill-attachment'] = mushroom_data_df['gill-attachment'].replace({'n': 'notched'})

# Gill-spacing
mushroom_data_df['gill-spacing'] = mushroom_data_df['gill-spacing'].replace({'c': 'close'})
mushroom_data_df['gill-spacing'] = mushroom_data_df['gill-spacing'].replace({'w': 'crowded'})
mushroom_data_df['gill-spacing'] = mushroom_data_df['gill-spacing'].replace({'d': 'distant'})

# Gill-size
mushroom_data_df['gill-size'] = mushroom_data_df['gill-size'].replace({'b': 'broad'})
mushroom_data_df['gill-size'] = mushroom_data_df['gill-size'].replace({'n': 'narrow'})

# Gill-color
mushroom_data_df['gill-color'] = mushroom_data_df['gill-color'].replace({'k': 'black'})
mushroom_data_df['gill-color'] = mushroom_data_df['gill-color'].replace({'n': 'brown'})
mushroom_data_df['gill-color'] = mushroom_data_df['gill-color'].replace({'b': 'buff'})
mushroom_data_df['gill-color'] = mushroom_data_df['gill-color'].replace({'h': 'chocolate'})
mushroom_data_df['gill-color'] = mushroom_data_df['gill-color'].replace({'g': 'gray'})
mushroom_data_df['gill-color'] = mushroom_data_df['gill-color'].replace({'r': 'green'})
mushroom_data_df['gill-color'] = mushroom_data_df['gill-color'].replace({'o': 'orange'})
mushroom_data_df['gill-color'] = mushroom_data_df['gill-color'].replace({'p': 'pink'})
mushroom_data_df['gill-color'] = mushroom_data_df['gill-color'].replace({'u': 'purple'})
mushroom_data_df['gill-color'] = mushroom_data_df['gill-color'].replace({'e': 'red'})
mushroom_data_df['gill-color'] = mushroom_data_df['gill-color'].replace({'w': 'white'})
mushroom_data_df['gill-color'] = mushroom_data_df['gill-color'].replace({'y': 'yellow'})

# Stalk-shape
mushroom_data_df['stalk-shape'] = mushroom_data_df['stalk-shape'].replace({'e': 'enlarging'})
mushroom_data_df['stalk-shape'] = mushroom_data_df['stalk-shape'].replace({'t': 'tapering'})

# stalk-root
mushroom_data_df['stalk-root'] = mushroom_data_df['stalk-root'].replace({'b': 'bulbous'})
mushroom_data_df['stalk-root'] = mushroom_data_df['stalk-root'].replace({'c': 'club'})
mushroom_data_df['stalk-root'] = mushroom_data_df['stalk-root'].replace({'u': 'cup'})
mushroom_data_df['stalk-root'] = mushroom_data_df['stalk-root'].replace({'e': 'equal'})
mushroom_data_df['stalk-root'] = mushroom_data_df['stalk-root'].replace({'z': 'rhizoporphs'})
mushroom_data_df['stalk-root'] = mushroom_data_df['stalk-root'].replace({'r': 'rooted'})
mushroom_data_df['stalk-root'] = mushroom_data_df['stalk-root'].replace({'?': 'missing'})

# stalk-surface-above-ring
mushroom_data_df['stalk-surface-above-ring'] = mushroom_data_df['stalk-surface-above-ring'].replace({'f': 'fibrous'})
mushroom_data_df['stalk-surface-above-ring'] = mushroom_data_df['stalk-surface-above-ring'].replace({'y': 'scaly'})
mushroom_data_df['stalk-surface-above-ring'] = mushroom_data_df['stalk-surface-above-ring'].replace({'k': 'silky'})
mushroom_data_df['stalk-surface-above-ring'] = mushroom_data_df['stalk-surface-above-ring'].replace({'s': 'smooth'})

# stalk-surface-below-ring
mushroom_data_df['stalk-surface-below-ring'] = mushroom_data_df['stalk-surface-below-ring'].replace({'f': 'fibrous'})
mushroom_data_df['stalk-surface-below-ring'] = mushroom_data_df['stalk-surface-below-ring'].replace({'y': 'scaly'})
mushroom_data_df['stalk-surface-below-ring'] = mushroom_data_df['stalk-surface-below-ring'].replace({'k': 'silky'})
mushroom_data_df['stalk-surface-below-ring'] = mushroom_data_df['stalk-surface-below-ring'].replace({'s': 'smooth'})

# stalk color above ring
mushroom_data_df['stalk-color-above-ring'] = mushroom_data_df['stalk-color-above-ring'].replace({'n': 'brown'})
mushroom_data_df['stalk-color-above-ring'] = mushroom_data_df['stalk-color-above-ring'].replace({'b': 'buff'})
mushroom_data_df['stalk-color-above-ring'] = mushroom_data_df['stalk-color-above-ring'].replace({'c': 'cinnamon'})
mushroom_data_df['stalk-color-above-ring'] = mushroom_data_df['stalk-color-above-ring'].replace({'g': 'gray'})
mushroom_data_df['stalk-color-above-ring'] = mushroom_data_df['stalk-color-above-ring'].replace({'o': 'orange'})
mushroom_data_df['stalk-color-above-ring'] = mushroom_data_df['stalk-color-above-ring'].replace({'p': 'pink'})
mushroom_data_df['stalk-color-above-ring'] = mushroom_data_df['stalk-color-above-ring'].replace({'e': 'red'})
mushroom_data_df['stalk-color-above-ring'] = mushroom_data_df['stalk-color-above-ring'].replace({'w': 'white'})
mushroom_data_df['stalk-color-above-ring'] = mushroom_data_df['stalk-color-above-ring'].replace({'y': 'yellow'})

# stalk color below ring
mushroom_data_df['stalk-color-below-ring'] = mushroom_data_df['stalk-color-below-ring'].replace({'n': 'brown'})
mushroom_data_df['stalk-color-below-ring'] = mushroom_data_df['stalk-color-below-ring'].replace({'b': 'buff'})
mushroom_data_df['stalk-color-below-ring'] = mushroom_data_df['stalk-color-below-ring'].replace({'c': 'cinnamon'})
mushroom_data_df['stalk-color-below-ring'] = mushroom_data_df['stalk-color-below-ring'].replace({'g': 'gray'})
mushroom_data_df['stalk-color-below-ring'] = mushroom_data_df['stalk-color-below-ring'].replace({'o': 'orange'})
mushroom_data_df['stalk-color-below-ring'] = mushroom_data_df['stalk-color-below-ring'].replace({'p': 'pink'})
mushroom_data_df['stalk-color-below-ring'] = mushroom_data_df['stalk-color-below-ring'].replace({'e': 'red'})
mushroom_data_df['stalk-color-below-ring'] = mushroom_data_df['stalk-color-below-ring'].replace({'w': 'white'})
mushroom_data_df['stalk-color-below-ring'] = mushroom_data_df['stalk-color-below-ring'].replace({'y': 'yellow'})

# veil-type
mushroom_data_df['veil-type'] = mushroom_data_df['veil-type'].replace({'p': 'partial'})
mushroom_data_df['veil-type'] = mushroom_data_df['veil-type'].replace({'u': 'universal'})

# veil-color
mushroom_data_df['veil-color'] = mushroom_data_df['veil-color'].replace({'n': 'brown'})
mushroom_data_df['veil-color'] = mushroom_data_df['veil-color'].replace({'o': 'orange'})
mushroom_data_df['veil-color'] = mushroom_data_df['veil-color'].replace({'w': 'white'})
mushroom_data_df['veil-color'] = mushroom_data_df['veil-color'].replace({'y': 'yellow'})

## ring-number
mushroom_data_df['ring-number'] = mushroom_data_df['ring-number'].replace({'n': 'none'})
mushroom_data_df['ring-number'] = mushroom_data_df['ring-number'].replace({'o': 'one'})
mushroom_data_df['ring-number'] = mushroom_data_df['ring-number'].replace({'t': 'two'})

# ring-type
mushroom_data_df['ring-type'] = mushroom_data_df['ring-type'].replace({'c': 'cobwebby'})
mushroom_data_df['ring-type'] = mushroom_data_df['ring-type'].replace({'e': 'evanescent'})
mushroom_data_df['ring-type'] = mushroom_data_df['ring-type'].replace({'f': 'flaring'})
mushroom_data_df['ring-type'] = mushroom_data_df['ring-type'].replace({'l': 'large'})
mushroom_data_df['ring-type'] = mushroom_data_df['ring-type'].replace({'n': 'none'})
mushroom_data_df['ring-type'] = mushroom_data_df['ring-type'].replace({'p': 'pendant'})
mushroom_data_df['ring-type'] = mushroom_data_df['ring-type'].replace({'s': 'sheathing'})
mushroom_data_df['ring-type'] = mushroom_data_df['ring-type'].replace({'z': 'zone'})

# spore-print-color
mushroom_data_df['spore-print-color'] = mushroom_data_df['spore-print-color'].replace({'k': 'black'})
mushroom_data_df['spore-print-color'] = mushroom_data_df['spore-print-color'].replace({'n': 'brown'})
mushroom_data_df['spore-print-color'] = mushroom_data_df['spore-print-color'].replace({'b': 'buff'})
mushroom_data_df['spore-print-color'] = mushroom_data_df['spore-print-color'].replace({'h': 'chocolate'})
mushroom_data_df['spore-print-color'] = mushroom_data_df['spore-print-color'].replace({'r': 'green'})
mushroom_data_df['spore-print-color'] = mushroom_data_df['spore-print-color'].replace({'o': 'orange'})
mushroom_data_df['spore-print-color'] = mushroom_data_df['spore-print-color'].replace({'u': 'purple'})
mushroom_data_df['spore-print-color'] = mushroom_data_df['spore-print-color'].replace({'w': 'white'})
mushroom_data_df['spore-print-color'] = mushroom_data_df['spore-print-color'].replace({'y': 'yellow'})

# population
mushroom_data_df['population'] = mushroom_data_df['population'].replace({'a': 'abundant'})
mushroom_data_df['population'] = mushroom_data_df['population'].replace({'c': 'clustered'})
mushroom_data_df['population'] = mushroom_data_df['population'].replace({'n': 'numerous'})
mushroom_data_df['population'] = mushroom_data_df['population'].replace({'s': 'scattered'})
mushroom_data_df['population'] = mushroom_data_df['population'].replace({'v': 'several'})
mushroom_data_df['population'] = mushroom_data_df['population'].replace({'y': 'solitary'})

# habitat
mushroom_data_df['habitat'] = mushroom_data_df['habitat'].replace({'g': 'grasses'})
mushroom_data_df['habitat'] = mushroom_data_df['habitat'].replace({'l': 'leaves'})
mushroom_data_df['habitat'] = mushroom_data_df['habitat'].replace({'m': 'meadows'})
mushroom_data_df['habitat'] = mushroom_data_df['habitat'].replace({'p': 'paths'})
mushroom_data_df['habitat'] = mushroom_data_df['habitat'].replace({'u': 'urban'})
mushroom_data_df['habitat'] = mushroom_data_df['habitat'].replace({'w': 'waste'})
mushroom_data_df['habitat'] = mushroom_data_df['habitat'].replace({'d': 'woods'})

In [25]:
mushroom_data_df.loc['classes']

KeyError: 'classes'