In [9]:
from selenium import webdriver
from selenium.webdriver.chrome.service import Service
from selenium.webdriver.chrome.options import Options
from bs4 import BeautifulSoup
import time
import os
from tqdm import tqdm

# Rank labels that are matched against the text of the scraped rank spans
keywords = ['Premium+', 'Premium', 'Bauteam', 'Spieler', 'Entwickler']

# One independent, initially empty list of player names per rank label
player_categories = dict((rank_label, []) for rank_label in keywords)

# Configure a headless Chrome session (GPU acceleration disabled)
chrome_options = Options()
for chrome_flag in ('--headless', '--disable-gpu'):
    chrome_options.add_argument(chrome_flag)
driver = webdriver.Chrome(options=chrome_options)

# Locate the directory holding the previously scraped player files.
# os.path.join picks the correct separator on every platform, so no per-OS
# branching is needed -- and there is no `directory = None` fallback, which
# would make os.listdir() silently scan the current working directory.
userOS = os.name
directory = os.path.join(os.getcwd(), "in-new")

# Player names are the file names (minus ".txt") of every non-log text file.
file_names = [
    file[:-4]
    for file in os.listdir(directory)
    if file.endswith(".txt") and "log" not in file
]

# List of players, source from directory with previously scraped player names
playerList = sorted(file_names)
renamed = ["BacardiSprite", "BearchenGott", "Livgo", "Lubotter2009"]

# Drop players that have been renamed; report (instead of silently ignoring)
# any name that was not present in the first place.
for name in renamed:
    if name in playerList:
        playerList.remove(name)
    else:
        print(name + " not in list.")

# Add new players
newPlayers = ["ScreamingBlatz", "xX_Masha_ggg_Xx9", 'Dokkkkko', 'GamemasterNiki', 'Krusti']

for name in newPlayers:
    if name not in playerList:
        playerList.append(name)

playerList = sorted(playerList)

# Remove every player that already has a .txt file on the desktop.
# Only .txt files are considered: other desktop entries (folders, shortcuts,
# ...) must not knock a player out of the list just because the names match.
desktop_path = os.path.expanduser("~/Desktop")
# A machine without a Desktop folder simply has nothing to exclude.
desktop_files = os.listdir(desktop_path) if os.path.isdir(desktop_path) else []
desktop_players = {file[:-4] for file in desktop_files if file.endswith(".txt")}
playerList = [name for name in playerList if name not in desktop_players]

# Remove duplicates from playerList (keeps first occurrence, preserves order)
playerList = list(dict.fromkeys(playerList))

# Function to scrape data for a single player
def scrape_player_data(player_name, wait_seconds=3.3):
    """Load a player's stats page and record which known ranks it shows.

    The page is opened with the module-level ``driver``, parsed with
    BeautifulSoup, and every ``<span class="player-rank">`` whose text is one
    of ``keywords`` causes ``player_name`` to be recorded in
    ``player_categories`` under that rank.

    Args:
        player_name: Name inserted into the stats URL.
        wait_seconds: Fixed delay after navigation to give the page time to
            fully load before its source is read. Defaults to 3.3 seconds.

    Returns:
        The text of the last matching rank span, or ``None`` if no span
        matched any keyword.
    """
    url = f"https://stats.cytooxien.de/player/{player_name}"
    driver.get(url)
    time.sleep(wait_seconds)  # Wait for the page to fully load
    soup = BeautifulSoup(driver.page_source, 'html.parser')

    last_rank = None
    # Inspect all <span> elements with class "player-rank"
    for rank in soup.find_all('span', class_='player-rank'):
        rank_text = rank.get_text(strip=True)  # Text content of the span
        if rank_text in keywords:
            # A page may contain the same rank span more than once; list the
            # player only once per category.
            if player_name not in player_categories[rank_text]:
                player_categories[rank_text].append(player_name)
            last_rank = rank_text
    return last_rank

# Scrape data for all players and display progress bar.
# The WebDriver is released in `finally` so that a failing page load or parse
# does not leave a headless Chrome process running in the background.
try:
    progress_bar = tqdm(playerList, desc="Scraping Progress", unit="player")
    for player_name in progress_bar:
        last_rank = scrape_player_data(player_name)
        progress_bar.set_postfix(last_rank=last_rank)

    # Print the results
    for category, players in player_categories.items():
        print(f"{category}: {players}")
finally:
    # Quit the WebDriver
    driver.quit()


Scraping Progress: 100%|██████████| 89/89 [05:03<00:00,  3.42s/player, last_rank=Spieler]   

Premium+: ['Freeeedom', 'GamemasterNiki', 'Ninivee', 'Pedrozockt', 'PolizeiDreamy', 'Umgfoin', 'cxl1lo']
Premium: ['Chander24', 'Ex4cted', 'Harold_Sensemann', 'HerrDante', 'KakaMC', 'Kokochampo', 'Mincheeen', 'Raefinzs', 'Sebi1801', 'SpeckyCut', 'cediiiiii_10', 'twitchparaskiill', 'ymq_']
Bauteam: ['Fflopse', 'Kanickelul', 'marbrueck']
Spieler: ['Anni808', 'Axollotel', 'BusinessBent', 'ByNetherdude', 'Chrisi20101', 'DarkCobweb', 'DerBaumIstDerWeg', 'Dokkkkko', 'Falke23_5', 'ForceFox', 'GeneralEnte06', 'Gobo9', 'GrafikKatze', 'Grapfen', 'Gummibearchen', 'H1ghsay', 'JOW23', 'Jan2220', 'JennieKim', 'Joy_8oy', 'JustK1lling', 'Kokochampi', 'Krusti', 'Kyuudo', 'LeWi_100', 'LordAlexos', 'Luis_XYZ', 'M0orey_0', 'Martomias', 'MrNulfred', 'Oronor', 'Picutar', 'PixlNight', 'Radattel', 'Ritokii', 'Sackkerl', 'ScreamingBlatz', 'Seemops_8', 'Sey__', 'StaudammAusHolz', 'Tomiokey', 'Txlentierter', 'WirdNichtGeladen', 'Wissender', '_Waldi_', '_n3d', 'agowskyy', 'bawskey', 'crocodile1870', 'frutigall', 




In [14]:
# Display the per-rank lists of player names (dict order follows `keywords`)
player_categories.values()

dict_values([['Freeeedom', 'GamemasterNiki', 'Ninivee', 'Pedrozockt', 'PolizeiDreamy', 'Umgfoin', 'cxl1lo'], ['Chander24', 'Ex4cted', 'Harold_Sensemann', 'HerrDante', 'KakaMC', 'Kokochampo', 'Mincheeen', 'Raefinzs', 'Sebi1801', 'SpeckyCut', 'cediiiiii_10', 'twitchparaskiill', 'ymq_'], ['Fflopse', 'Kanickelul', 'marbrueck'], ['Anni808', 'Axollotel', 'BusinessBent', 'ByNetherdude', 'Chrisi20101', 'DarkCobweb', 'DerBaumIstDerWeg', 'Dokkkkko', 'Falke23_5', 'ForceFox', 'GeneralEnte06', 'Gobo9', 'GrafikKatze', 'Grapfen', 'Gummibearchen', 'H1ghsay', 'JOW23', 'Jan2220', 'JennieKim', 'Joy_8oy', 'JustK1lling', 'Kokochampi', 'Krusti', 'Kyuudo', 'LeWi_100', 'LordAlexos', 'Luis_XYZ', 'M0orey_0', 'Martomias', 'MrNulfred', 'Oronor', 'Picutar', 'PixlNight', 'Radattel', 'Ritokii', 'Sackkerl', 'ScreamingBlatz', 'Seemops_8', 'Sey__', 'StaudammAusHolz', 'Tomiokey', 'Txlentierter', 'WirdNichtGeladen', 'Wissender', '_Waldi_', '_n3d', 'agowskyy', 'bawskey', 'crocodile1870', 'frutigall', 'h4nnes', 'jimmi1410'