In [1]:
import pandas as pd

def drop_duplicates(csv_file, urls_csv_file="all_pole_studios_germany_cl.csv"):
    """
    Combine a pole studios csv with a csv of studio URLs and return one row
    per business name.

    The 'Studio Workshop Url: SW' column of the URL csv is attached to the
    studio rows by matching on 'Business Name'. The merge is an outer join,
    so names that appear in only one of the two files are kept and their
    missing columns are filled with NaN.

    :param csv_file: Path to the csv file containing the pole studios
        information. Must contain a 'Business Name' column.
    :param urls_csv_file: Path to the csv file containing the studio URLs.
        Must contain the 'Business Name' and 'Studio Workshop Url: SW'
        columns. Defaults to "all_pole_studios_germany_cl.csv".
    :return: A dataframe with a fresh 0..n-1 index and no repeated
        'Business Name' values; the first occurrence of each name wins.
    :raises KeyError: If a required column is missing from either file.
    """
    key_column = 'Business Name'
    url_column = 'Studio Workshop Url: SW'

    # Load the csv files
    studios = pd.read_csv(csv_file)
    studio_urls = pd.read_csv(urls_csv_file)

    # Fail early with a message that names the offending file and column
    if key_column not in studios.columns:
        raise KeyError("{!r} has no {!r} column".format(csv_file, key_column))
    missing = [col for col in (key_column, url_column) if col not in studio_urls.columns]
    if missing:
        raise KeyError("{!r} is missing column(s): {}".format(urls_csv_file, missing))

    # De-duplicate each side *before* merging: a name repeated in both files
    # would otherwise be expanded into every left/right combination by the
    # merge, only to be thrown away again afterwards.
    studios = studios.drop_duplicates(subset=key_column)
    url_mapping = (
        studio_urls.loc[:, [key_column, url_column]]
        .drop_duplicates(subset=key_column)
    )

    # Outer join keeps business names that are present in only one file
    merged_df = pd.merge(studios, url_mapping, on=key_column, how='outer')

    # Both inputs are already unique per name; this final pass is kept as a
    # cheap guard before handing back a cleanly re-indexed frame.
    merged_df = merged_df.drop_duplicates(subset=key_column).reset_index(drop=True)

    return merged_df

In [2]:
# Build the merged, de-duplicated studio table from the scraped studios csv
# and leave it as the cell's last expression so the notebook renders it.
studios_csv = "all_pole_studios_germany.csv"
df = drop_duplicates(studios_csv)
df


Unnamed: 0,City,Image Source,Business Name,Rating,Number of Reviews,Categories,Address,Studio Workshop Url: SW
0,Aachen,https://files.eversports.com/b5fbdb8d-cc1e-44a...,poda Studio,rating,"4,9 (47 Rezensionen)","['Fitness', 'Tanzen', 'Yoga', 'Poledance', '+ ...","Martinstraße 10-12 , 52062 Aachen",https://www.eversports.de/sw/poda-studio
1,Aachen,https://files.eversports.com/0aed1787-d224-486...,Pura Studio,rating,5 (60 Rezensionen),"['Yoga', 'Poledance', 'Massage', 'Stretching',...","Schaufenberger Straße 61 , 52477 Alsdorf",https://www.eversports.de/sw/pura-studio
2,Abensberg,https://files.eversports.com/a73d40e1-eaf2-430...,Polesition Regensburg,rating,"4,9 (27 Rezensionen)","['Pilates', 'Tanzen', 'Poledance', 'Aerial Yog...","Rebhuhnstraße 4, 93326 Abensberg",https://www.eversports.de/sw/polesition-regens...
3,Abensberg,https://files.eversports.com/9b5f6e3a-5ec8-45f...,Sportheim Abensberg,rating,"4,9 (36 Rezensionen)","['Fitness', 'Pilates', 'Poledance', 'Aerial Yo...","Von-Hazzi-Straße 7, 93326 Abensberg",https://www.eversports.de/sw/sportheim-abensberg
4,Achern,https://files.eversports.com/0fe3af8e-230c-4d1...,Körperformfabrik GbR,rating,"4,9 (3 Rezensionen)","['Poledance', 'TRX®', 'TRX® Yoga', 'TRX® Suspe...","Hauptstraße 108 , 77855 Achern",https://www.eversports.de/sw/körperformfabrik-gbr
...,...,...,...,...,...,...,...,...
126,Rheinfelden,https://files.eversports.com/ada68e9c-7bfc-4ce...,Dayuma - Pole & Acrobatics,rating,5 (21 Rezensionen),"['Poledance', 'Akrobatik', 'Acroyoga', 'Stretc...","Auf dem Wolf 18 , 4052 Basel",https://www.eversports.de/sw/dayuma---pole-&-a...
127,Rheinfelden,https://files.eversports.com/596619e4-9146-413...,LOFT1 BASEL CITY,rating,"4,7 (27 Rezensionen)","['Fitness', 'Poledance']","Centralbahnplatz 10 , 4051 Basel",https://www.eversports.de/sw/loft1-basel-city
128,Rheinfelden,https://files.eversports.com/b42766e6-b1ea-420...,SWISS MEGA PARK,rating,"4,5 (12 Rezensionen)","['Tennis', 'Badminton', 'Basketball', 'Eishock...","Schützenstrasse 2, 4402 Frenkendorf",https://www.eversports.de/sw/swiss-mega-park
129,Soest,https://files.eversports.com/eca53eeb-765a-4f6...,Aerial Studio,rating,"4,8 (16 Rezensionen)","['Poledance', 'Aerial Yoga', 'Aerial Silk', 'A...","Mississippidreef 2, 3565 CG Utrecht",https://www.eversports.de/sw/aerial-studio


In [None]:
# Persist the merged table; index=False keeps the row index out of the file.
output_csv = "all_pole_studios_germany_&_Didi_not_validated_urls.csv"
df.to_csv(output_csv, index=False)