In [1]:
# This script demonstrates how to read an Excel file using the pandas library.
# The `read_excel` function is a versatile tool for this task.

# --- Prerequisite: Install the required libraries ---
# You need pandas and an Excel engine like openpyxl.
# Run this command in your terminal if you don't have them installed:
# pip install pandas openpyxl

import pandas as pd
import os

# Create a dummy Excel file for demonstration purposes.
# In a real-world scenario, this file would already exist.
def create_dummy_excel_file(path='sample_data.xlsx'):
    """Write a small two-sheet Excel workbook used by the reading demos.

    The workbook gets an 'Employees' sheet (Name, Age, City) followed by a
    'Products' sheet (Product, Price, Stock), three rows each. Both sheets
    are written without the DataFrame index column.

    Args:
        path: Destination of the workbook. Defaults to 'sample_data.xlsx',
            so calling the function without arguments behaves exactly as
            before.

    Returns:
        None. Two progress messages are printed to stdout.
    """
    print(f"Creating '{path}' for demonstration...")

    # Sheet name -> column data. Dict insertion order is the order in which
    # the sheets are written to the workbook.
    sheets = {
        'Employees': {
            'Name': ['Alice', 'Bob', 'Charlie'],
            'Age': [25, 30, 35],
            'City': ['New York', 'London', 'Paris'],
        },
        'Products': {
            'Product': ['Laptop', 'Mouse', 'Keyboard'],
            'Price': [1200, 25, 75],
            'Stock': [10, 50, 30],
        },
    }

    # Used as a context manager so the writer is closed when the block exits.
    with pd.ExcelWriter(path) as writer:
        for sheet_name, columns in sheets.items():
            pd.DataFrame(columns).to_excel(writer, sheet_name=sheet_name, index=False)

    print(f"File '{path}' created.\n")


# --- Method 1: Reading the first sheet (default behavior) ---
def read_first_sheet():
    """Load the first sheet of 'sample_data.xlsx' and print it.

    Prints a header line, then either the loaded DataFrame or an error
    message when the workbook is missing, then a 40-dash separator.
    Only FileNotFoundError is handled; any other exception propagates.

    Returns:
        None.
    """
    print("--- Reading the first sheet ('Employees') ---")
    try:
        # No sheet_name is passed: read_excel falls back to the first sheet (index 0).
        first_sheet = pd.read_excel('sample_data.xlsx')
    except FileNotFoundError:
        print("Error: The file 'sample_data.xlsx' was not found.")
    else:
        print(first_sheet)
    print("-" * 40, end="\n\n")

# --- Method 2: Reading a specific sheet by name ---
def read_sheet_by_name():
    """Load the 'Products' sheet of 'sample_data.xlsx' by name and print it.

    Prints a header line, then either the loaded DataFrame or an error
    message when the workbook is missing, then a 40-dash separator.
    Only FileNotFoundError is handled; any other exception propagates.

    Returns:
        None.
    """
    separator = "-" * 40 + "\n"
    print("--- Reading the sheet by name ('Products') ---")
    try:
        # sheet_name selects the worksheet by its tab name instead of its position.
        products = pd.read_excel('sample_data.xlsx', sheet_name='Products')
    except FileNotFoundError:
        outcome = "Error: The file 'sample_data.xlsx' was not found."
    else:
        outcome = products
    print(outcome)
    print(separator)

# --- Method 3: Reading specific columns from a sheet ---
def read_specific_columns():
    """Load only the 'Name' and 'City' columns of the 'Employees' sheet and print them.

    Prints a header line, then either the loaded DataFrame or an error
    message when the workbook is missing, then a 40-dash separator.
    Only FileNotFoundError is handled; any other exception propagates.

    Returns:
        None.
    """
    print("--- Reading specific columns ('Name' and 'City') ---")
    # usecols limits parsing to these columns; it takes a list of column
    # names (as here) or a string of Excel column letters such as 'A,C'.
    wanted_columns = ['Name', 'City']
    try:
        report = pd.read_excel(
            'sample_data.xlsx',
            sheet_name='Employees',
            usecols=wanted_columns,
        )
    except FileNotFoundError:
        report = "Error: The file 'sample_data.xlsx' was not found."
    print(report)
    print(f"{'-' * 40}\n")


# Main execution block
if __name__ == "__main__":
    # Generate the sample workbook only when it is absent, so an existing
    # 'sample_data.xlsx' is never overwritten.
    workbook_present = os.path.exists('sample_data.xlsx')
    if not workbook_present:
        create_dummy_excel_file()

    # Run the demos in order: first sheet, sheet by name, selected columns.
    for run_demo in (read_first_sheet, read_sheet_by_name, read_specific_columns):
        run_demo()

Creating 'sample_data.xlsx' for demonstration...
File 'sample_data.xlsx' created.

--- Reading the first sheet ('Employees') ---
      Name  Age      City
0    Alice   25  New York
1      Bob   30    London
2  Charlie   35     Paris
----------------------------------------

--- Reading the sheet by name ('Products') ---
    Product  Price  Stock
0    Laptop   1200     10
1     Mouse     25     50
2  Keyboard     75     30
----------------------------------------

--- Reading specific columns ('Name' and 'City') ---
      Name      City
0    Alice  New York
1      Bob    London
2  Charlie     Paris
----------------------------------------



In [None]:
# Colab-specific cell: imports the `drive` helper from the google.colab
# package and calls its mount() with the path /content/drive (presumably
# attaching the user's Google Drive at that location).
# NOTE(review): this cell is unexecuted (In [None]) and nothing in the visible
# notebook reads from /content/drive — confirm it is still needed. The import
# presumably fails outside Google Colab, where google.colab is not installed.
from google.colab import drive
drive.mount('/content/drive')