In [37]:
import pandas as pd
import numpy as np
import csv
import warnings

pd.set_option('display.max_rows', None)
pd.set_option('display.max_columns', None)

warnings.filterwarnings('ignore')

In [38]:
# Reduces Memory used on your computer. 
# Helpful when your data is large it reduces the memory used 
# so your script/notebook doesn't crash with out of memory errors
def reduce_mem_usage(df, verbose=True):
    numerics = ['int16', 'int32', 'int64', 'float16', 'float32', 'float64']
    start_mem = df.memory_usage().sum() / 1024**2    
    for col in df.columns:
        col_type = df[col].dtypes
        if col_type in numerics:
            c_min = df[col].min()
            c_max = df[col].max()
            if str(col_type)[:3] == 'int':
                if c_min > np.iinfo(np.int8).min and c_max < np.iinfo(np.int8).max:
                    df[col] = df[col].astype(np.int8)
                elif c_min > np.iinfo(np.int16).min and c_max < np.iinfo(np.int16).max:
                    df[col] = df[col].astype(np.int16)
                elif c_min > np.iinfo(np.int32).min and c_max < np.iinfo(np.int32).max:
                    df[col] = df[col].astype(np.int32)
                elif c_min > np.iinfo(np.int64).min and c_max < np.iinfo(np.int64).max:
                    df[col] = df[col].astype(np.int64)  
            else:
                if c_min > np.finfo(np.float16).min and c_max < np.finfo(np.float16).max:
                    df[col] = df[col].astype(np.float16)
                elif c_min > np.finfo(np.float32).min and c_max < np.finfo(np.float32).max:
                    df[col] = df[col].astype(np.float32)
                else:
                    df[col] = df[col].astype(np.float64)    
    end_mem = df.memory_usage().sum() / 1024**2
    if verbose: print('Mem. usage decreased to {:5.2f} Mb ({:.1f}% reduction)'.format(end_mem, 100 * (start_mem - end_mem) / start_mem))
    return df

In [39]:
UncleanData = pd.read_csv('Assignment1Data_Sample.csv')
UncleanData = reduce_mem_usage(UncleanData)

Mem. usage decreased to  0.06 Mb (4.9% reduction)


In [40]:
UncleanData.head()

Unnamed: 0,Object Number,Object ID,Department,Object Name,Title,Culture,Period,Dynasty,Reign,Portfolio,Artist Role,Artist Prefix,Artist Display Name,Artist Display Bio,Artist Suffix,Artist Nationality,Artist Begin Date,Artist End Date,Object Date,Object Begin Date,Object End Date,Medium,Dimensions,Credit Line,Geography Type,City,State,County,Country,Region,Subregion,Locale,Locus,Excavation,River,Classification,Rights and Reproduction,Link Resource,Metadata Date,Repository,Tags
0,62.16,1674,American Decorative Arts,Side Chair,Side Chair,American,,,,,Maker,Attributed to,Samuel McIntire,1757–1811,,,1757.0,1811.0,1794–99,1794,1799.0,"Mahogany, ebony, ash, birch, white pine",37 7/8 x 27 7/8 x 18 in. (96.2 x 70.8 x 45.7 cm),"Friends of the American Wing Fund, 1962",Made in,Salem,,,United States,,,,,,,Furniture,,http://www.metmuseum.org/art/collection/search...,5/13/2019 8:00,"Metropolitan Museum of Art, New York, NY",Chairs
1,13.7.17,2430,American Decorative Arts,Pitcher,Covered Pitcher,American,,,,,,,,,,,,,1700–1900,1700,1900.0,Earthenware,7 1/4 x 6 3/8 x 5 1/2 in. (18.4 x 16.2 x 14 cm),"Rogers Fund, 1913",Made in,,,,United States,,,,,,,Ceramics,,http://www.metmuseum.org/art/collection/search...,5/13/2019 8:00,"Metropolitan Museum of Art, New York, NY",Pitchers
2,33.85.11,6406,American Decorative Arts,Plate,Plate,Dutch,,,,,,,,,,,,,1740–60,1740,1760.0,Earthenware,Diam. 8 7/8 in. (22.5 cm),"Rogers Fund, 1933",Made in,Delft,,,Netherlands,,,,,,,Ceramics,,http://www.metmuseum.org/art/collection/search...,5/13/2019 8:00,"Metropolitan Museum of Art, New York, NY",
3,69.194.109,7616,American Decorative Arts,Soup bowl,Soup Bowl,American,,,,,Maker,,Union Porcelain Works,1863–ca. 1922,,,1863.0,1922.0,1885,1885,1885.0,Porcelain,H. 1 7/16 in. (3.7 cm); Diam. 8 3/4 in. (22.2 cm),"Gift of Mr. and Mrs. Franklin Chace, 1969",Made in,Brooklyn,,,United States,,,,,,,Ceramics,,http://www.metmuseum.org/art/collection/search...,5/13/2019 8:00,"Metropolitan Museum of Art, New York, NY",Bowls
4,2006.235.20,15012,American Decorative Arts,"Painting, miniature",Portrait of a Lady,American,,,,,Artist,,John Henry Brown,1818–1891,,,1818.0,1891.0,ca. 1840,1840,1840.0,Watercolor on ivory,2 11/16 x 2 3/16 in. (6.8 x 5.6 cm),"Fletcher Fund, 2006",,,,,,,,,,,,Paintings,,http://www.metmuseum.org/art/collection/search...,5/13/2019 8:00,"Metropolitan Museum of Art, New York, NY",Pendants|Portraits|Women


In [41]:
# Number of records in your dataset
len(UncleanData)

204

In [42]:
UncleanData.describe()

Unnamed: 0,Object ID,Object Begin Date,Object End Date
count,204.0,204.0,202.0
mean,393179.387255,1293.377451,inf
std,230139.277682,1337.679724,inf
min,1674.0,-7000.0,-5000.0
25%,216475.0,1566.0,1600.0
50%,378235.5,1800.0,1870.0
75%,624197.5,1910.0,1935.0
max,824428.0,2003.0,2004.0


In [43]:
#Selecting the prefered columns
CleanData = UncleanData[['Object ID', 'Department', 'Object Name', 'Title', 'Culture', 'Artist Nationality', 'Object Begin Date', 'Object End Date', 'Medium', 'Credit Line', 'Country']]
CleanData

Unnamed: 0,Object ID,Department,Object Name,Title,Culture,Artist Nationality,Object Begin Date,Object End Date,Medium,Credit Line,Country
0,1674,American Decorative Arts,Side Chair,Side Chair,American,,1794,1799.0,"Mahogany, ebony, ash, birch, white pine","Friends of the American Wing Fund, 1962",United States
1,2430,American Decorative Arts,Pitcher,Covered Pitcher,American,,1700,1900.0,Earthenware,"Rogers Fund, 1913",United States
2,6406,American Decorative Arts,Plate,Plate,Dutch,,1740,1760.0,Earthenware,"Rogers Fund, 1933",Netherlands
3,7616,American Decorative Arts,Soup bowl,Soup Bowl,American,,1885,1885.0,Porcelain,"Gift of Mr. and Mrs. Franklin Chace, 1969",United States
4,15012,American Decorative Arts,"Painting, miniature",Portrait of a Lady,American,,1840,1840.0,Watercolor on ivory,"Fletcher Fund, 2006",
5,23510,Arms and Armor,Arrowhead (Yanonē),Arrowhead (Yanonē),Japanese,,1701,1800.0,Steel,"The Collection of Giovanni P. Morosini, presen...",
6,29920,Arms and Armor,Knife handle (Kozuka),Knife Handle (Kozuka),Japanese,,1770,1852.0,"Copper-gold alloy (shakudō), copper-silver all...","The Howard Mansfield Collection, Gift of Howar...",
7,32848,Arms and Armor,Coin (Thaler),Coin (Thaler) Showing August I (The Pious) of ...,German,,1580,1580.0,Silver,"Gift of Bashford Dean, 1923",
8,34014,Arms and Armor,Two drawings,Drawings Showing Combat on Foot (Champ Clos),German,,1501,1600.0,"Pen, ink and watercolor on paper","Bashford Dean Memorial Collection, Funds from ...",
9,34308,Arms and Armor,Partisan,Partisan,German,,1701,1800.0,"Steel, wood, textile, metallic thread","Bashford Dean Memorial Collection, Gift of Edw...",


In [44]:
CleanData.columns

Index(['Object ID', 'Department', 'Object Name', 'Title', 'Culture',
       'Artist Nationality', 'Object Begin Date', 'Object End Date', 'Medium',
       'Credit Line', 'Country'],
      dtype='object')

In [45]:
# What is your data type?]
CleanData.dtypes

Object ID               int32
Department             object
Object Name            object
Title                  object
Culture                object
Artist Nationality     object
Object Begin Date       int16
Object End Date       float16
Medium                 object
Credit Line            object
Country                object
dtype: object

In [46]:
# Check the format
CleanData.info()


<class 'pandas.core.frame.DataFrame'>
RangeIndex: 204 entries, 0 to 203
Data columns (total 11 columns):
 #   Column              Non-Null Count  Dtype  
---  ------              --------------  -----  
 0   Object ID           204 non-null    int32  
 1   Department          203 non-null    object 
 2   Object Name         203 non-null    object 
 3   Title               194 non-null    object 
 4   Culture             84 non-null     object 
 5   Artist Nationality  87 non-null     object 
 6   Object Begin Date   204 non-null    int16  
 7   Object End Date     202 non-null    float16
 8   Medium              202 non-null    object 
 9   Credit Line         204 non-null    object 
 10  Country             32 non-null     object 
dtypes: float16(1), int16(1), int32(1), object(8)
memory usage: 14.5+ KB


In [47]:
#numbers of missing rows in a collumn
df = CleanData
df.isna().sum()

Object ID               0
Department              1
Object Name             1
Title                  10
Culture               120
Artist Nationality    117
Object Begin Date       0
Object End Date         2
Medium                  2
Credit Line             0
Country               172
dtype: int64

In [48]:
#replacing missing values of numeric rolls with its column mean value
df.fillna(df.mean())

Unnamed: 0,Object ID,Department,Object Name,Title,Culture,Artist Nationality,Object Begin Date,Object End Date,Medium,Credit Line,Country
0,1674,American Decorative Arts,Side Chair,Side Chair,American,,1794,1799.0,"Mahogany, ebony, ash, birch, white pine","Friends of the American Wing Fund, 1962",United States
1,2430,American Decorative Arts,Pitcher,Covered Pitcher,American,,1700,1900.0,Earthenware,"Rogers Fund, 1913",United States
2,6406,American Decorative Arts,Plate,Plate,Dutch,,1740,1760.0,Earthenware,"Rogers Fund, 1933",Netherlands
3,7616,American Decorative Arts,Soup bowl,Soup Bowl,American,,1885,1885.0,Porcelain,"Gift of Mr. and Mrs. Franklin Chace, 1969",United States
4,15012,American Decorative Arts,"Painting, miniature",Portrait of a Lady,American,,1840,1840.0,Watercolor on ivory,"Fletcher Fund, 2006",
5,23510,Arms and Armor,Arrowhead (Yanonē),Arrowhead (Yanonē),Japanese,,1701,1800.0,Steel,"The Collection of Giovanni P. Morosini, presen...",
6,29920,Arms and Armor,Knife handle (Kozuka),Knife Handle (Kozuka),Japanese,,1770,1852.0,"Copper-gold alloy (shakudō), copper-silver all...","The Howard Mansfield Collection, Gift of Howar...",
7,32848,Arms and Armor,Coin (Thaler),Coin (Thaler) Showing August I (The Pious) of ...,German,,1580,1580.0,Silver,"Gift of Bashford Dean, 1923",
8,34014,Arms and Armor,Two drawings,Drawings Showing Combat on Foot (Champ Clos),German,,1501,1600.0,"Pen, ink and watercolor on paper","Bashford Dean Memorial Collection, Funds from ...",
9,34308,Arms and Armor,Partisan,Partisan,German,,1701,1800.0,"Steel, wood, textile, metallic thread","Bashford Dean Memorial Collection, Gift of Edw...",


In [49]:
# Dropping or removing some NaN rows
#indexes_to_drop = df.loc[ (df['Title'].isna())].index
indexes_to_drop = df.loc[ (df['Culture'].isna())].index
#indexes_to_drop = df.loc[ (df['Artist Nationality'].isna())].index
#indexes_to_drop = df.loc[ (df['Object End Date'].isna())].index
#indexes_to_drop = df.loc[ (df['Country'].isna())].index



  
# drop these given row indexes from dataFrame 
Dropped = df.drop(indexes_to_drop)

In [50]:
#Show us the number of rolls after removing the missing rolls
print('Before dropping: ',len(df))
print('After dropping: ',len(Dropped))

Before dropping:  204
After dropping:  84


In [51]:
Dropped

Unnamed: 0,Object ID,Department,Object Name,Title,Culture,Artist Nationality,Object Begin Date,Object End Date,Medium,Credit Line,Country
0,1674,American Decorative Arts,Side Chair,Side Chair,American,,1794,1799.0,"Mahogany, ebony, ash, birch, white pine","Friends of the American Wing Fund, 1962",United States
1,2430,American Decorative Arts,Pitcher,Covered Pitcher,American,,1700,1900.0,Earthenware,"Rogers Fund, 1913",United States
2,6406,American Decorative Arts,Plate,Plate,Dutch,,1740,1760.0,Earthenware,"Rogers Fund, 1933",Netherlands
3,7616,American Decorative Arts,Soup bowl,Soup Bowl,American,,1885,1885.0,Porcelain,"Gift of Mr. and Mrs. Franklin Chace, 1969",United States
4,15012,American Decorative Arts,"Painting, miniature",Portrait of a Lady,American,,1840,1840.0,Watercolor on ivory,"Fletcher Fund, 2006",
5,23510,Arms and Armor,Arrowhead (Yanonē),Arrowhead (Yanonē),Japanese,,1701,1800.0,Steel,"The Collection of Giovanni P. Morosini, presen...",
6,29920,Arms and Armor,Knife handle (Kozuka),Knife Handle (Kozuka),Japanese,,1770,1852.0,"Copper-gold alloy (shakudō), copper-silver all...","The Howard Mansfield Collection, Gift of Howar...",
7,32848,Arms and Armor,Coin (Thaler),Coin (Thaler) Showing August I (The Pious) of ...,German,,1580,1580.0,Silver,"Gift of Bashford Dean, 1923",
8,34014,Arms and Armor,Two drawings,Drawings Showing Combat on Foot (Champ Clos),German,,1501,1600.0,"Pen, ink and watercolor on paper","Bashford Dean Memorial Collection, Funds from ...",
9,34308,Arms and Armor,Partisan,Partisan,German,,1701,1800.0,"Steel, wood, textile, metallic thread","Bashford Dean Memorial Collection, Gift of Edw...",


In [52]:
indexes_to_drop2 = Dropped.loc[ (df['Title'].isna())].index



  
# drop these given row indexes from dataFrame 
Dropped = Dropped.drop(indexes_to_drop2)

In [53]:
#Show us the number of rolls after removing the missing rolls
print('Before dropping: ',len(df))
print('After dropping: ',len(Dropped))

Before dropping:  204
After dropping:  74


In [54]:
Dropped

Unnamed: 0,Object ID,Department,Object Name,Title,Culture,Artist Nationality,Object Begin Date,Object End Date,Medium,Credit Line,Country
0,1674,American Decorative Arts,Side Chair,Side Chair,American,,1794,1799.0,"Mahogany, ebony, ash, birch, white pine","Friends of the American Wing Fund, 1962",United States
1,2430,American Decorative Arts,Pitcher,Covered Pitcher,American,,1700,1900.0,Earthenware,"Rogers Fund, 1913",United States
2,6406,American Decorative Arts,Plate,Plate,Dutch,,1740,1760.0,Earthenware,"Rogers Fund, 1933",Netherlands
3,7616,American Decorative Arts,Soup bowl,Soup Bowl,American,,1885,1885.0,Porcelain,"Gift of Mr. and Mrs. Franklin Chace, 1969",United States
4,15012,American Decorative Arts,"Painting, miniature",Portrait of a Lady,American,,1840,1840.0,Watercolor on ivory,"Fletcher Fund, 2006",
5,23510,Arms and Armor,Arrowhead (Yanonē),Arrowhead (Yanonē),Japanese,,1701,1800.0,Steel,"The Collection of Giovanni P. Morosini, presen...",
6,29920,Arms and Armor,Knife handle (Kozuka),Knife Handle (Kozuka),Japanese,,1770,1852.0,"Copper-gold alloy (shakudō), copper-silver all...","The Howard Mansfield Collection, Gift of Howar...",
7,32848,Arms and Armor,Coin (Thaler),Coin (Thaler) Showing August I (The Pious) of ...,German,,1580,1580.0,Silver,"Gift of Bashford Dean, 1923",
8,34014,Arms and Armor,Two drawings,Drawings Showing Combat on Foot (Champ Clos),German,,1501,1600.0,"Pen, ink and watercolor on paper","Bashford Dean Memorial Collection, Funds from ...",
9,34308,Arms and Armor,Partisan,Partisan,German,,1701,1800.0,"Steel, wood, textile, metallic thread","Bashford Dean Memorial Collection, Gift of Edw...",


In [55]:
#Change object end date to int
# Converting selected columns to string
Dropped[['Object End Date']] = Dropped[['Object End Date']].astype(int)

In [56]:
#adjusting the values in Object End Date 

sorted(Dropped['Object End Date'].unique())


[-3100,
 -2000,
 -1450,
 -501,
 -475,
 -450,
 -400,
 -300,
 -275,
 400,
 800,
 1150,
 1270,
 1275,
 1299,
 1520,
 1580,
 1600,
 1699,
 1750,
 1760,
 1765,
 1780,
 1799,
 1800,
 1815,
 1840,
 1850,
 1852,
 1872,
 1885,
 1899,
 1900,
 1939,
 1943,
 1949,
 1950,
 1959,
 1966,
 1967,
 1980,
 1984,
 1987,
 1989,
 2000,
 2004]

In [57]:
#Let's split some values with comma in culture 
#Starting from Culture we can see that there are some null values and we would like to remove these rows
df = Dropped.copy()
df = df.dropna(subset=['Culture'], how='all')
df

Unnamed: 0,Object ID,Department,Object Name,Title,Culture,Artist Nationality,Object Begin Date,Object End Date,Medium,Credit Line,Country
0,1674,American Decorative Arts,Side Chair,Side Chair,American,,1794,1799,"Mahogany, ebony, ash, birch, white pine","Friends of the American Wing Fund, 1962",United States
1,2430,American Decorative Arts,Pitcher,Covered Pitcher,American,,1700,1900,Earthenware,"Rogers Fund, 1913",United States
2,6406,American Decorative Arts,Plate,Plate,Dutch,,1740,1760,Earthenware,"Rogers Fund, 1933",Netherlands
3,7616,American Decorative Arts,Soup bowl,Soup Bowl,American,,1885,1885,Porcelain,"Gift of Mr. and Mrs. Franklin Chace, 1969",United States
4,15012,American Decorative Arts,"Painting, miniature",Portrait of a Lady,American,,1840,1840,Watercolor on ivory,"Fletcher Fund, 2006",
5,23510,Arms and Armor,Arrowhead (Yanonē),Arrowhead (Yanonē),Japanese,,1701,1800,Steel,"The Collection of Giovanni P. Morosini, presen...",
6,29920,Arms and Armor,Knife handle (Kozuka),Knife Handle (Kozuka),Japanese,,1770,1852,"Copper-gold alloy (shakudō), copper-silver all...","The Howard Mansfield Collection, Gift of Howar...",
7,32848,Arms and Armor,Coin (Thaler),Coin (Thaler) Showing August I (The Pious) of ...,German,,1580,1580,Silver,"Gift of Bashford Dean, 1923",
8,34014,Arms and Armor,Two drawings,Drawings Showing Combat on Foot (Champ Clos),German,,1501,1600,"Pen, ink and watercolor on paper","Bashford Dean Memorial Collection, Funds from ...",
9,34308,Arms and Armor,Partisan,Partisan,German,,1701,1800,"Steel, wood, textile, metallic thread","Bashford Dean Memorial Collection, Gift of Edw...",


In [58]:
sorted(df.Culture.unique())

['Abelam people',
 'American',
 'Asmat people',
 'Atlantic Watershed',
 'Aztec',
 'British',
 'British, Chelsea',
 'British, Stoke-on-Trent, Staffordshire',
 'Byzantine',
 'Catalan',
 'China',
 'Cypriot',
 'Dutch',
 'European',
 'European or Middle Eastern',
 'European, Eastern',
 'French',
 'German',
 'German, Hanau',
 'German, Silesia (Bunzlau)',
 'Greek, Attic',
 'Iran',
 'Italian',
 'Italian, Venice',
 'Italic',
 'Japanese',
 'Mexican',
 'Minoan',
 'Minoan, Crete',
 'Quechua',
 'Romanian',
 'South Netherlandish',
 'Spanish',
 'Timor',
 'possibly Greek',
 'possibly Spanish',
 'probably French',
 'probably German']

In [63]:
#Add "Missing" to NaN values in the columns or rows Artist Nationality

df['Artist Nationality'] = df['Artist Nationality'].fillna('Missing Values')
df['Department'] = df['Department'].fillna('Missing Values')
df['Country'] = df['Country'].fillna('Missing Values')
df

Unnamed: 0,Object ID,Department,Object Name,Title,Culture,Artist Nationality,Object Begin Date,Object End Date,Medium,Credit Line,Country
0,1674,American Decorative Arts,Side Chair,Side Chair,American,Missing Values,1794,1799,"Mahogany, ebony, ash, birch, white pine","Friends of the American Wing Fund, 1962",United States
1,2430,American Decorative Arts,Pitcher,Covered Pitcher,American,Missing Values,1700,1900,Earthenware,"Rogers Fund, 1913",United States
2,6406,American Decorative Arts,Plate,Plate,Dutch,Missing Values,1740,1760,Earthenware,"Rogers Fund, 1933",Netherlands
3,7616,American Decorative Arts,Soup bowl,Soup Bowl,American,Missing Values,1885,1885,Porcelain,"Gift of Mr. and Mrs. Franklin Chace, 1969",United States
4,15012,American Decorative Arts,"Painting, miniature",Portrait of a Lady,American,Missing Values,1840,1840,Watercolor on ivory,"Fletcher Fund, 2006",Missing Values
5,23510,Arms and Armor,Arrowhead (Yanonē),Arrowhead (Yanonē),Japanese,Missing Values,1701,1800,Steel,"The Collection of Giovanni P. Morosini, presen...",Missing Values
6,29920,Arms and Armor,Knife handle (Kozuka),Knife Handle (Kozuka),Japanese,Missing Values,1770,1852,"Copper-gold alloy (shakudō), copper-silver all...","The Howard Mansfield Collection, Gift of Howar...",Missing Values
7,32848,Arms and Armor,Coin (Thaler),Coin (Thaler) Showing August I (The Pious) of ...,German,Missing Values,1580,1580,Silver,"Gift of Bashford Dean, 1923",Missing Values
8,34014,Arms and Armor,Two drawings,Drawings Showing Combat on Foot (Champ Clos),German,Missing Values,1501,1600,"Pen, ink and watercolor on paper","Bashford Dean Memorial Collection, Funds from ...",Missing Values
9,34308,Arms and Armor,Partisan,Partisan,German,Missing Values,1701,1800,"Steel, wood, textile, metallic thread","Bashford Dean Memorial Collection, Gift of Edw...",Missing Values


In [64]:
# Manually replacing incorrect values
df['Country'] = df['Country'].str.replace("present-day France","France")

In [65]:
#sorted(df.Country.unique())
df

Unnamed: 0,Object ID,Department,Object Name,Title,Culture,Artist Nationality,Object Begin Date,Object End Date,Medium,Credit Line,Country
0,1674,American Decorative Arts,Side Chair,Side Chair,American,Missing Values,1794,1799,"Mahogany, ebony, ash, birch, white pine","Friends of the American Wing Fund, 1962",United States
1,2430,American Decorative Arts,Pitcher,Covered Pitcher,American,Missing Values,1700,1900,Earthenware,"Rogers Fund, 1913",United States
2,6406,American Decorative Arts,Plate,Plate,Dutch,Missing Values,1740,1760,Earthenware,"Rogers Fund, 1933",Netherlands
3,7616,American Decorative Arts,Soup bowl,Soup Bowl,American,Missing Values,1885,1885,Porcelain,"Gift of Mr. and Mrs. Franklin Chace, 1969",United States
4,15012,American Decorative Arts,"Painting, miniature",Portrait of a Lady,American,Missing Values,1840,1840,Watercolor on ivory,"Fletcher Fund, 2006",Missing Values
5,23510,Arms and Armor,Arrowhead (Yanonē),Arrowhead (Yanonē),Japanese,Missing Values,1701,1800,Steel,"The Collection of Giovanni P. Morosini, presen...",Missing Values
6,29920,Arms and Armor,Knife handle (Kozuka),Knife Handle (Kozuka),Japanese,Missing Values,1770,1852,"Copper-gold alloy (shakudō), copper-silver all...","The Howard Mansfield Collection, Gift of Howar...",Missing Values
7,32848,Arms and Armor,Coin (Thaler),Coin (Thaler) Showing August I (The Pious) of ...,German,Missing Values,1580,1580,Silver,"Gift of Bashford Dean, 1923",Missing Values
8,34014,Arms and Armor,Two drawings,Drawings Showing Combat on Foot (Champ Clos),German,Missing Values,1501,1600,"Pen, ink and watercolor on paper","Bashford Dean Memorial Collection, Funds from ...",Missing Values
9,34308,Arms and Armor,Partisan,Partisan,German,Missing Values,1701,1800,"Steel, wood, textile, metallic thread","Bashford Dean Memorial Collection, Gift of Edw...",Missing Values


In [66]:
#Remove duplicate rows inplace
df.drop_duplicates()
df

Unnamed: 0,Object ID,Department,Object Name,Title,Culture,Artist Nationality,Object Begin Date,Object End Date,Medium,Credit Line,Country
0,1674,American Decorative Arts,Side Chair,Side Chair,American,Missing Values,1794,1799,"Mahogany, ebony, ash, birch, white pine","Friends of the American Wing Fund, 1962",United States
1,2430,American Decorative Arts,Pitcher,Covered Pitcher,American,Missing Values,1700,1900,Earthenware,"Rogers Fund, 1913",United States
2,6406,American Decorative Arts,Plate,Plate,Dutch,Missing Values,1740,1760,Earthenware,"Rogers Fund, 1933",Netherlands
3,7616,American Decorative Arts,Soup bowl,Soup Bowl,American,Missing Values,1885,1885,Porcelain,"Gift of Mr. and Mrs. Franklin Chace, 1969",United States
4,15012,American Decorative Arts,"Painting, miniature",Portrait of a Lady,American,Missing Values,1840,1840,Watercolor on ivory,"Fletcher Fund, 2006",Missing Values
5,23510,Arms and Armor,Arrowhead (Yanonē),Arrowhead (Yanonē),Japanese,Missing Values,1701,1800,Steel,"The Collection of Giovanni P. Morosini, presen...",Missing Values
6,29920,Arms and Armor,Knife handle (Kozuka),Knife Handle (Kozuka),Japanese,Missing Values,1770,1852,"Copper-gold alloy (shakudō), copper-silver all...","The Howard Mansfield Collection, Gift of Howar...",Missing Values
7,32848,Arms and Armor,Coin (Thaler),Coin (Thaler) Showing August I (The Pious) of ...,German,Missing Values,1580,1580,Silver,"Gift of Bashford Dean, 1923",Missing Values
8,34014,Arms and Armor,Two drawings,Drawings Showing Combat on Foot (Champ Clos),German,Missing Values,1501,1600,"Pen, ink and watercolor on paper","Bashford Dean Memorial Collection, Funds from ...",Missing Values
9,34308,Arms and Armor,Partisan,Partisan,German,Missing Values,1701,1800,"Steel, wood, textile, metallic thread","Bashford Dean Memorial Collection, Gift of Edw...",Missing Values


In [154]:
#Exporting my Final Data
df.to_csv(r'CleanDataAss1.csv')