# Import XLSX (Excel)

In [None]:
import time
import pandas as pd
from helpers.helper_functions import init_connection, excel_import

# Record the wall-clock start time. The final cell subtracts this value from
# its own time.time() reading to report the total runtime, so the measured
# span includes the connection setup below.
start_time = time.time()

# Call the project helper init_connection() and keep the returned handle; it
# is later passed to excel_import() as `graph`.
# NOTE(review): presumably a Neo4j graph connection object — confirm in
# helpers.helper_functions.
graph = init_connection()

### Import from Excel

This block defines the source path for the Excel file that contains the data to be imported into the Neo4j knowledge graph. It uses pandas.ExcelFile() to load the workbook located at ../data/import/import_data.xlsx. Once the file is loaded, it calls the excel_import() function, passing in the Excel file and the active Neo4j graph connection. The function handles reading the contents of the Excel sheets and creating the corresponding nodes and relationships in the database. This step is essential for populating the graph with new data from external sources.

In [None]:
# Open the workbook that holds the data to be imported. Using ExcelFile as a
# context manager guarantees the underlying file handle is closed once the
# import has finished, even if excel_import() raises.
with pd.ExcelFile("../data/import/import_data.xlsx") as excel_file:
    # hand the open workbook and the active database connection to the
    # project's import helper
    excel_import(excel_file=excel_file, graph=graph)

### Timestamp
This block prints the timestamp indicating when the script was executed and displays the total runtime. It uses `time.strftime()` to format the current date and time in the `dd.mm.yyyy hh:mm:ss` format. Then it calculates the total execution time by subtracting the recorded start time from the current time. Finally, it prints the total runtime in seconds, giving the user insight into how long the entire Excel import took to complete.

In [None]:
# Print when the script was executed (dd.mm.yyyy hh:mm:ss).
# The strftime format uses single quotes: reusing the f-string's own quote
# character inside a replacement field is a SyntaxError before Python 3.12.
print(f"This script was run on: {time.strftime('%d.%m.%Y %H:%M:%S')}")

# stop the runtime timer
end_time = time.time()

# calculate the total execution time (seconds since start_time was recorded
# in the first cell)
total_time = end_time - start_time

# print the total execution time, rounded to two decimals
print(f"Total execution time: {total_time:.2f} seconds")