In [1]:
import pandas as pd

def normalize_coordinates(coord):
    """
    Convert a coordinate string such as "45.5°N" into a signed float.

    The '°' symbol and surrounding whitespace are removed. A trailing
    direction letter (N, E, S, W; case-insensitive) is optional:
    - 'S' (South) and 'W' (West) negate the numeric value
    - 'N', 'E', or no letter at all leave the value unchanged

    Args:
        coord: Coordinate text, e.g. "45.5°N", "73.5° W" or "12.25".

    Returns:
        The coordinate as a float, negated for South/West.

    Raises:
        ValueError: If the string is empty or its numeric part cannot be
            parsed by float().
    """
    text = coord.replace("°", "").strip()
    if not text:
        raise ValueError(f"Empty coordinate: {coord!r}")

    # Only treat the last character as a direction when it really is one;
    # otherwise a plain number like "45.5" would lose its final digit.
    direction = text[-1].upper()
    if direction in ("N", "E", "S", "W"):
        number = text[:-1]
    else:
        direction = ""
        number = text

    value = float(number)  # float() tolerates leftover surrounding whitespace
    if direction in ("S", "W"):
        return -value
    return value

# Read data from file
with open("coord1000.txt", "r", encoding="utf-8") as file:
    # Strip surrounding whitespace and drop blank lines
    stripped_lines = (line.strip() for line in file)
    lines = [line for line in stripped_lines if line]

# The file is expected to alternate: a university name line followed by a
# "<label>: <coord1>, <coord2>" line. Fail early with a clear message if a
# name is left without its coordinate line.
if len(lines) % 2:
    raise ValueError(
        f"Expected name/coordinate line pairs but found {len(lines)} "
        f"non-empty lines; unpaired last line: {lines[-1]!r}"
    )

# Parse the data
universities = []
for university, coord_line in zip(lines[::2], lines[1::2]):
    try:
        coords = coord_line.split(": ")[1]
        coord1, coord2 = coords.split(", ")
        coord1 = normalize_coordinates(coord1)
        coord2 = normalize_coordinates(coord2)
    except (IndexError, ValueError) as err:
        # Name the offending record so a bad entry in a large file is easy to find
        raise ValueError(
            f"Cannot parse coordinates for {university!r}: {coord_line!r}"
        ) from err
    universities.append([university, coord1, coord2])  # No website column

# Create a DataFrame without the Website column
df = pd.DataFrame(universities, columns=["University", "Latitude", "Longitude"])

# Save to Excel
output_path = "coord1000.xlsx"
df.to_excel(output_path, index=False)
print(f"Data saved to {output_path}")

Data saved to coord1000.xlsx
