In [None]:
import pandas as pd

# Read the raw listings from the Excel export.
df = pd.read_excel("hamREMAX.xlsx")

# Split 'location' on '/' into at most three parts (n=2). An extra '/' then
# stays inside the last part instead of producing a fourth column, which would
# make a three-column assignment fail with a length mismatch.
location_parts = df['location'].str.split('/', n=2, expand=True)

# Assign each part by position and trim surrounding whitespace. A position only
# exists in the split result if at least one row has that many parts, so a
# missing position still yields an (empty) column instead of an error.
for position, column in enumerate(['İl', 'İlçe', 'Mahalle']):
    if position in location_parts.columns:
        df[column] = location_parts[position].str.strip()
    else:
        df[column] = None

# Pull two pieces out of 'Isıtma': the run of word characters directly before
# an opening parenthesis goes to 'Yakıt Tipi', and the text inside the
# parentheses goes to 'Isıtma Türü'.
# NOTE(review): values without parentheses do not match, so both new columns
# are NaN for those rows and the source column is dropped below — confirm that
# losing those values is acceptable.
df[['Yakıt Tipi', 'Isıtma Türü']] = df['Isıtma'].str.extract(r'(\w+)\s*\((.*?)\)')

# The source columns have been replaced by the derived ones.
df = df.drop(columns=['location', 'Isıtma'])

# Save the cleaned DataFrame to a new CSV file, without the index column.
df.to_csv("duzenlenmis_REMAX.csv", index=False)

# Inform the user that the operation is complete
print("New columns added, old columns removed, and the file was saved as 'duzenlenmis_REMAX.csv'.")

In [None]:

import pandas as pd
# Read the dataset from CSV.
df = pd.read_csv("emlakjet_bursa_kiralik_daire_detaylari_new.csv")

# Split "Konum" on " - "; positions 0, 1 and 2 become city, district and
# neighborhood. Any further parts are ignored.
konum_split = df["Konum"].str.split(" - ", expand=True)

# A position only exists in the split result if at least one row has that many
# parts, so look each one up defensively instead of indexing it directly
# (direct indexing raises KeyError when the position is absent).
for position, column in enumerate(["İl", "İlçe", "Mahalle"]):
    df[column] = konum_split[position] if position in konum_split.columns else None

# Drop the original "Konum" column by rebinding rather than mutating in place.
df = df.drop(columns=["Konum"])

# Define a function to separate heating type and fuel type
def ayir_isitma_yakit(tip):
    """Split a combined heating description into heating type and fuel type.

    The text is lower-cased and searched for the known fuel names in a fixed
    order; the first one found becomes the fuel type and whatever text remains
    becomes the heating type. Both results are title-cased.

    Parameters
    ----------
    tip : object
        Raw heating description. Missing values (as judged by ``pd.isna``) are
        accepted; other non-string values are converted with ``str``.

    Returns
    -------
    pd.Series
        Two elements: ``[heating_type, fuel_type]``. An element is ``None``
        when that piece is absent (missing input, blank text, no known fuel
        name, or nothing left once the fuel name is removed).
    """
    if pd.isna(tip):
        return pd.Series([None, None])

    # Coerce to text so a stray non-string cell does not raise on .lower().
    tip = str(tip).lower()
    yakitlar = ["doğalgaz", "kat kaloriferi", "fuel oil", "kömür", "elektrik"]
    isitma_tipi = None
    yakit_tipi = None

    # The first listed fuel name that occurs in the text wins.
    for yakit in yakitlar:
        if yakit in tip:
            yakit_tipi = yakit.title()
            # Remove the fuel name, then tidy what is left: drop a now-empty
            # "()", collapse repeated whitespace, and trim dangling separators.
            kalan = tip.replace(yakit, "").replace("()", " ")
            kalan = " ".join(kalan.split()).strip(" -/,")
            # An empty remainder means there is no separate heating type.
            isitma_tipi = kalan.title() or None
            break

    if not yakit_tipi:
        # No known fuel name: the whole (whitespace-normalised) text is the
        # heating type; blank text yields None.
        isitma_tipi = " ".join(tip.split()).title() or None

    return pd.Series([isitma_tipi, yakit_tipi])

# Run the splitter over every "Isıtma Tipi" value. The resulting two-column
# frame overwrites "Isıtma Tipi" and fills the new "Yakıt Tipi" column.
isitma_yakit = df["Isıtma Tipi"].apply(ayir_isitma_yakit)
df[["Isıtma Tipi", "Yakıt Tipi"]] = isitma_yakit

# Write the updated dataset to a new CSV file, without the index column.
output_path = "emlakjet_bursa_kiralik_daire_detaylari_duzenlenmis.csv"
df.to_csv(path_or_buf=output_path, index=False)

'emlakjet_bursa_kiralik_daire_detaylari_duzenlenmis.csv'

In [None]:
import pandas as pd

# Read the CSV file. Malformed lines are still skipped, but each one now
# triggers a warning so dropped rows are visible instead of vanishing silently.
df = pd.read_csv("hepsiemlak_bursa_ilan_detaylari.csv", on_bad_lines='warn')

# Function to split the 'Konum' column into city, district, and neighborhood
def konum_ayir(konum):
    """Split a '/'-separated location into city, district and neighborhood.

    Each part is stripped of surrounding whitespace, and every "Mah."
    occurrence is removed from the neighborhood part.

    Parameters
    ----------
    konum : object
        Location text expected to contain exactly three '/'-separated parts.

    Returns
    -------
    pd.Series
        ``[il, ilce, mahalle]``; all three are ``None`` when the value is not
        a string or does not split into exactly three parts.
    """
    try:
        il, ilce, mahalle = [parca.strip() for parca in konum.split('/')]
    except (AttributeError, TypeError, ValueError):
        # AttributeError/TypeError: the value is not a string (e.g. NaN).
        # ValueError: the split produced fewer or more than three parts.
        # Anything else (including KeyboardInterrupt) is allowed to propagate.
        return pd.Series([None, None, None])

    mahalle = mahalle.replace("Mah.", "").strip()
    return pd.Series([il, ilce, mahalle])

# Run konum_ayir on every 'Konum' value and store the three results as the
# new 'İl', 'İlçe' and 'Mahalle' columns.
konum_parcalari = df['Konum'].apply(konum_ayir)
df[['İl', 'İlçe', 'Mahalle']] = konum_parcalari

# The source column has been replaced by the three derived ones.
df = df.drop(columns='Konum')

# Print the first five rows as a quick check of the result.
print(df.head(5))

# Write the updated data to an Excel file, without the index column.
df.to_excel("konum_ayrilmis_veri.xlsx", index=False)

In [None]:
import pandas as pd

# Read the CSV file containing real estate details
df = pd.read_csv("hepsiemlak_bursa_daire_detaylari_new.csv")

# Extract three pieces from 'Konum' with a regex: the lazy groups take the
# text before the first space ('İl'), the text before the next space ('İlçe'),
# and the following text up to and including " Mah." ('Mahalle').
# NOTE(review): the "Mah." suffix is kept in 'Mahalle' here, whereas konum_ayir
# in the previous cell removes it — confirm whether the two outputs should agree.
df[['İl', 'İlçe', 'Mahalle']] = df['Konum'].str.extract(r'^(.*?) (.*?) (.*? Mah\.)')

# Remove leading and trailing whitespace from each of the new columns
for column in ['İl', 'İlçe', 'Mahalle']:
    df[column] = df[column].str.strip()

# Rows that do not match the pattern get NaN in all three columns, and their
# original text disappears once 'Konum' is dropped. Report how many rows are
# affected so the loss is not silent.
unmatched = int(df['İl'].isna().sum())
if unmatched:
    print(f"Uyarı: {unmatched} satırda konum ayrıştırılamadı; İl/İlçe/Mahalle boş bırakıldı.")
    # (Warning: the location could not be parsed in N rows; İl/İlçe/Mahalle were left empty.)

# Drop the original 'Konum' column
df = df.drop(columns=['Konum'])

# Save the modified DataFrame to a new CSV file
df.to_csv("hepsiemlak_bursa_daire_detaylari_new_split.csv", index=False)

# Print a confirmation message
print("Konum başarıyla 3 sütuna bölündü ve yeni dosya kaydedildi.")
# (Location was successfully split into 3 columns and the new file was saved.)