
# How to import existing files with Pandas

Complete tutorial accessible via: https://neuraspike.com/blog/how-to-import-existing-files-with-pandas/


In [None]:
import pandas as pd

### How to load and save CSV files in Python with Pandas

In [None]:
# Load the CSV from its raw URL into a DataFrame.
url_raw_link = "https://git.io/JL7o9"
daily_female_birth = pd.read_csv(
    url_raw_link,
    sep=",",
)

# Preview the first rows of the loaded frame.
daily_female_birth.head()

In [None]:
# Write the DataFrame to a local CSV file.
filename = "./daily-female-birth.csv"

# index=False keeps the auto-generated row index out of the file, so
# reloading the CSV does not produce an extra unnamed leading column.
# This matches the Excel exports in this notebook, which also pass
# index=False.
daily_female_birth.to_csv(path_or_buf=filename, sep=",", index=False)

### How to load and save JSON format files in Python with Pandas

In [None]:
# Column-oriented data: every column maps a string row label ("0", "1", ...)
# to the value stored in that row.
nba_players = {
    "Name": {
        "0": "LeBron James",
        "1": "Stephen Curry",
        "2": "James Harden",
    },
    "Gender": {
        "0": "Male",
        "1": "Male",
        "2": "Male",
    },
    "Nationality": {
        "0": "USA",
        "1": "USA",
        "2": "USA",
    },
}

# Outer keys become the columns, inner keys become the row labels.
nba_players_df = pd.DataFrame(nba_players)
print(nba_players_df)

# ---------------- output ----------------
#          Name     Gender     Nationality
# 0   LeBron James   Male         USA
# 1  Stephen Curry   Male         USA
# 2   James Harden   Male         USA

In [None]:
# Destination file for the serialized DataFrame.
filename = "nba_players.json"

# Serialize the DataFrame to a .json file on disk.
nba_players_df.to_json(filename)

# ---------------- output ----------------
#{
#  "Name": {
#    "0": "LeBron James",
#    "1": "Stephen Curry",
#    "2": "James Harden"
#  },
#  "Gender": {
#    "0": "Male",
#    "1": "Male",
#    "2": "Male"
#  },
#  "Nationality": {
#    "0": "USA",
#    "1": "USA",
#    "2": "USA"
#  }
#}
# The content above is shown pretty-printed for readability; to format the
# file the same way, open https://codebeautify.org/jsonviewer -> Click on Beautify

In [None]:
# Load the .json file back into a DataFrame.
filename = "nba_players.json"
nba_players_df = pd.read_json(filename)

# Preview the first rows of the reloaded frame.
nba_players_df.head()

### How to load and save Excel files in Python with Pandas

In [None]:
# Column-oriented data: every column maps a string row label ("0", "1", ...)
# to the value stored in that row.
football_players = {
    "Name": {
        "0": "Lionel Messi",
        "1": "Cristiano Ronaldo",
        "2": "Kylian Mbappé",
        "3": "Mohamed Salah",
        "4": "Neymar da Silva Santos Júnior",
    },
    "Gender": {
        "0": "Male",
        "1": "Male",
        "2": "Male",
        "3": "Male",
        "4": "Male",
    },
    # The column holds country names, so row "0" is "Argentina" (not the
    # demonym "Argentine"); this also matches the documented output below.
    "Nationality": {
        "0": "Argentina",
        "1": "Portugal",
        "2": "France",
        "3": "Egypt",
        "4": "Brazil",
    },
}

# Outer keys become the columns, inner keys become the row labels.
football_players_df = pd.DataFrame(data=football_players)
print(football_players_df)

# ------------------------ output ----------------------
#                            Name   Gender  Nationality
# 0                   Lionel Messi   Male   Argentina
# 1              Cristiano Ronaldo   Male    Portugal
# 2                  Kylian Mbappé   Male      France
# 3                  Mohamed Salah   Male       Egypt
# 4  Neymar da Silva Santos Júnior   Male      Brazil

In [None]:
# Target workbook and the name of the worksheet to create inside it.
file_path = './Football Players.xlsx'
sheet_name = "Football Players"

# Export the frame as a single-sheet workbook; index=False leaves the
# row labels out of the sheet.
football_players_df.to_excel(
    file_path,
    sheet_name=sheet_name,
    index=False,
)

In [None]:
# Map each worksheet name to the DataFrame that should be written to it.
sport_sheets = {
    'Football Players': football_players_df,
    'Basketball Players': nba_players_df,
}

filename_path = './Sport men.xlsx'

# Use ExcelWriter as a context manager: the workbook is saved and closed when
# the block exits, even if one of the writes raises. The explicit
# writer.save() call was deprecated in pandas 1.5 and removed in pandas 2.0.
with pd.ExcelWriter(path=filename_path) as writer:

    # iterate through the sheets 'Football Players' and 'Basketball Players'
    for sheet_name, sheet_df in sport_sheets.items():

        # write each DataFrame to its own worksheet of the same workbook
        sheet_df.to_excel(excel_writer=writer,
                          sheet_name=sheet_name, index=False)

#### How to load specific sheets in Excel

In [None]:
# Workbook to read and the worksheet to pull from it.
file_path = './Sport men.xlsx'
sheet_name = "Football Players"

# Load the requested worksheet into a DataFrame.
football_players_df = pd.read_excel(
    file_path,
    sheet_name=sheet_name,
)
print(football_players_df)

# ------------------------ output ----------------------
#                            Name   Gender  Nationality
# 0                   Lionel Messi   Male   Argentina
# 1              Cristiano Ronaldo   Male    Portugal
# 2                  Kylian Mbappé   Male      France
# 3                  Mohamed Salah   Male       Egypt
# 4  Neymar da Silva Santos Júnior   Male      Brazil

In [None]:
# Switch to the basketball worksheet; `file_path` is reused from the
# previous cell.
sheet_name = "Basketball Players"

# Load the requested worksheet into a DataFrame.
nba_players_df = pd.read_excel(
    file_path,
    sheet_name=sheet_name,
)
print(nba_players_df)

# ---------------- output ----------------
#          Name     Gender     Nationality
# 0   LeBron James   Male         USA
# 1  Stephen Curry   Male         USA
# 2   James Harden   Male         USA

#### Reading Specific Columns from an Excel File

In [None]:
# Workbook, worksheet, and the zero-based column positions to keep.
file_path = './Sport men.xlsx'
sheet_name = "Basketball Players"
columns = [0, 2]  # name & nationality

# Load only the selected columns of the worksheet.
nba_players_df = pd.read_excel(
    file_path,
    sheet_name=sheet_name,
    usecols=columns,
)
print(nba_players_df)

# ---------------- output ----------------
#          Name        Nationality
# 0   LeBron James         USA
# 1   Stephen Curry        USA
# 2   James Harden         USA



In [None]:
# NOTE(review): this cell repeats the previous cell verbatim.
# Workbook, worksheet, and the zero-based column positions to keep.
file_path = './Sport men.xlsx'
sheet_name = "Basketball Players"
columns = [0, 2]  # name & nationality

# Load only the selected columns of the worksheet.
nba_players_df = pd.read_excel(
    file_path,
    sheet_name=sheet_name,
    usecols=columns,
)
print(nba_players_df)

# ---------------- output ----------------
#          Name        Nationality
# 0   LeBron James         USA
# 1   Stephen Curry        USA
# 2   James Harden         USA

#### How to load specific sheets in Excel

In [None]:
# NOTE(review): this cell repeats an earlier "load specific sheets" cell
# of this notebook verbatim.
# Workbook to read and the worksheet to pull from it.
file_path = './Sport men.xlsx'
sheet_name = "Football Players"

# Load the requested worksheet into a DataFrame.
football_players_df = pd.read_excel(
    file_path,
    sheet_name=sheet_name,
)
print(football_players_df)

# ------------------------ output ----------------------
#                            Name   Gender  Nationality
# 0                   Lionel Messi   Male   Argentina
# 1              Cristiano Ronaldo   Male    Portugal
# 2                  Kylian Mbappé   Male      France
# 3                  Mohamed Salah   Male       Egypt
# 4  Neymar da Silva Santos Júnior   Male      Brazil

In [None]:
# NOTE(review): this cell repeats an earlier basketball-sheet cell of this
# notebook verbatim.
# Switch to the basketball worksheet; `file_path` is reused from the
# previous cell.
sheet_name = "Basketball Players"

# Load the requested worksheet into a DataFrame.
nba_players_df = pd.read_excel(
    file_path,
    sheet_name=sheet_name,
)
print(nba_players_df)

# ---------------- output ----------------
#          Name     Gender     Nationality
# 0   LeBron James   Male         USA
# 1  Stephen Curry   Male         USA
# 2   James Harden   Male         USA

#### Reading Specific Columns from an Excel File

In [None]:
# NOTE(review): this cell repeats an earlier "specific columns" cell of this
# notebook verbatim.
# Workbook, worksheet, and the zero-based column positions to keep.
file_path = './Sport men.xlsx'
sheet_name = "Basketball Players"
columns = [0, 2]  # name & nationality

# Load only the selected columns of the worksheet.
nba_players_df = pd.read_excel(
    file_path,
    sheet_name=sheet_name,
    usecols=columns,
)
print(nba_players_df)

# ---------------- output ----------------
#          Name        Nationality
# 0   LeBron James         USA
# 1   Stephen Curry        USA
# 2   James Harden         USA