In [3]:
import pandas as pd

# Function to import data from a CSV file
def import_data(file_name):
    """Load a CSV file into a pandas DataFrame.

    Args:
        file_name: Path of the CSV file to read.

    Returns:
        The loaded DataFrame, or None when the file does not exist
        (a message is printed in that case instead of raising).
    """
    try:
        # Read the path the caller passed in; a hard-coded path here would
        # make the success message below report a file that was never read.
        data = pd.read_csv(file_name)
    except FileNotFoundError:
        print("File not found. Please check the file name.")
        return None

    print(f"Data successfully loaded from {file_name}")
    return data

# Function to export data to a CSV file
def export_data(data, file_name):
    """Write a DataFrame to a CSV file, omitting the index column.

    Args:
        data: DataFrame to export. None (e.g. the result of a failed
            import) is reported and skipped rather than attempted.
        file_name: Destination path of the CSV file.

    Returns:
        None. Failures are printed, not raised.
    """
    # Guard explicitly so a missing dataset yields a clear message instead
    # of an AttributeError surfaced through the generic handler below.
    if data is None:
        print("Data not available to export.")
        return

    try:
        data.to_csv(file_name, index=False)
    except Exception as e:
        # Best-effort export: report the failure without crashing the caller.
        print(f"Error exporting data: {e}")
    else:
        print(f"Data successfully exported to {file_name}")

# Function to show details of the dataset
def show_dataset_details(data):
    """Print an overview of a dataset to standard output.

    Reports the shape, the first five rows, the element count and the
    per-column count of missing values. When numeric columns exist, their
    sum, mean, minimum and maximum are printed as well.

    Args:
        data: DataFrame to describe, or None when no data was loaded.
    """
    # Nothing to describe without a dataset.
    if data is None:
        print("Data not available to show details.")
        return

    dimensions = data.shape
    print("Number of rows and columns:", dimensions)

    preview = data.head()
    print("\nFirst five rows:\n", preview)

    element_count = data.size
    print("\nSize of the dataset (number of elements):", element_count)

    missing_per_column = data.isnull().sum()
    print("\nNumber of missing values in each column:\n", missing_per_column)

    # Summary statistics only apply to numeric columns.
    numeric_names = data.select_dtypes(include='number').columns
    if numeric_names.empty:
        print("\nNo numerical columns found.")
        return

    numeric_part = data[numeric_names]
    print("\nSummary statistics for numerical columns:")
    report = (
        ("Sum:\n", numeric_part.sum),
        ("\nAverage:\n", numeric_part.mean),
        ("\nMinimum values:\n", numeric_part.min),
        ("\nMaximum values:\n", numeric_part.max),
    )
    for heading, compute in report:
        print(heading, compute())

# Main function to run the program
if __name__ == "__main__":
    # Script entry point: load the dataset, print its details, then write a
    # copy to a new CSV file.

    # Modify the file name to the dataset you want to load. It names the
    # dataset this notebook actually reads, so the "loaded from" message
    # matches the data being shown.
    file_name = '/content/renewable-energy-stock-account-2007-2022.csv'

    # Import data (None when the file could not be found)
    data = import_data(file_name)

    # Show details of the dataset (reports unavailability when data is None)
    show_dataset_details(data)

    # Export the data to a new CSV file, but only if something was loaded;
    # attempting to export a missing dataset would just produce an error.
    export_file_name = 'exported_sample_dataset.csv'
    if data is not None:
        export_data(data, export_file_name)


Data successfully loaded from sample_dataset.csv
Number of rows and columns: (800, 8)

First five rows:
    year resource        variable           units   magnitude  \
0  2007   Biogas   Closing stock         Dollars   Thousands   
1  2007   Biogas      Generation  Gigawatt hours      Actual   
2  2007   Biogas  Gigawatt hours          Number  Proportion   
3  2007   Biogas   Opening stock         Dollars   Thousands   
4  2007   Biogas   Other changes         Dollars   Thousands   

                   source  data_value flag  
0  Environmental Accounts    64848.00    F  
1                    MBIE      224.00    F  
2                    MBIE        0.01    F  
3  Environmental Accounts         NaN    F  
4  Environmental Accounts         NaN    F  

Size of the dataset (number of elements): 6400

Number of missing values in each column:
 year           0
resource       0
variable       0
units          0
magnitude      0
source         0
data_value    14
flag           0
dtype: int64
