In [None]:
import os
import subprocess
import pandas as pd
import json
import time

# ============= CONFIG ============= #
# Excel workbook that main() loads with pandas.read_excel.
XLSX_PATH = "Top500Website.xlsx"     
# Name of the workbook column that holds the domains to process.
ROOT_DOMAIN_COLUMN = "Root Domain"  
# Working directory in which `node app.js <url>` is launched for the crawler.
CRAWLER_PATH = "Source/Crawler"
# Working directory in which `node app.js <folder>` is launched for the detector.
DETECTOR_PATH = "Source/Detector"
# Directory holding one sub-folder per website; each is checked for result.json.
RESULTS_PATH = "Source/Results"
# Upper bound on how many domains (taken from the top of the column) are processed.
MAX_WEBSITES = 400  
# ================================== #


def normalize_domain(domain: str) -> str:
    """Return *domain* as a URL, prefixing ``https://`` when no scheme is present.

    Surrounding whitespace is removed first. A value that already starts with
    ``http://`` or ``https://`` (in any letter case) is returned unchanged
    apart from the stripping.
    """
    domain = domain.strip()
    # Compare case-insensitively so "HTTP://example.com" is not turned into
    # "https://HTTP://example.com".
    if domain.lower().startswith(("http://", "https://")):
        return domain
    return "https://" + domain


def domain_to_folder(domain: str) -> str:
    """Convert a domain like 'www.bbc.com' into a folder name: 'www_bbc_com'.

    Surrounding whitespace is stripped (matching ``normalize_domain``), any
    ``https://`` / ``http://`` text is removed, and every dot becomes an
    underscore.
    """
    # Strip first so a padded spreadsheet cell yields the same folder name as
    # the clean domain would.
    host = domain.strip()
    for scheme in ("https://", "http://"):
        host = host.replace(scheme, "")
    return host.replace(".", "_")


# Retry Mechanism for Crawler & Detector 
def run_crawler_with_retry(url, retries=1):
    """Run the Node crawler for *url*, retrying while it exits non-zero.

    Each attempt executes ``node app.js <url>`` with ``CRAWLER_PATH`` as the
    working directory.

    Args:
        url: URL handed to the crawler as its only argument.
        retries: Maximum number of attempts (the first run counts as one).

    Returns:
        True as soon as an attempt exits with return code 0, False when every
        attempt failed.
    """
    for attempt in range(1, retries + 1):
        print(f"\nüîÅ Crawler attempt {attempt}/{retries} for {url}")
        result = subprocess.run(["node", "app.js", url], cwd=CRAWLER_PATH)
        if result.returncode == 0:
            print("‚úÖ Crawler success")
            return True
        # Only announce a retry and pause when another attempt will follow.
        if attempt < retries:
            print("‚ùå Crawler failed, retrying...")
            time.sleep(2)
    # Report the real attempt count rather than a hard-coded number.
    print(f"‚õî Crawler failed after {retries} attempt(s)")
    return False


def run_detector_with_retry(folder_path, retries=3):
    """Run the Node detector on *folder_path*, retrying while it exits non-zero.

    Each attempt executes ``node app.js <folder_path>`` with ``DETECTOR_PATH``
    as the working directory, so a relative *folder_path* is resolved from
    that directory.

    Args:
        folder_path: Path handed to the detector as its only argument.
        retries: Maximum number of attempts (the first run counts as one).

    Returns:
        True as soon as an attempt exits with return code 0, False when every
        attempt failed.
    """
    for attempt in range(1, retries + 1):
        print(f"\nüîÅ Detector attempt {attempt}/{retries} for {folder_path}")
        result = subprocess.run(["node", "app.js", folder_path], cwd=DETECTOR_PATH)
        if result.returncode == 0:
            print("‚úÖ Detector success")
            return True
        # Only announce a retry and pause when another attempt will follow.
        if attempt < retries:
            print("‚ùå Detector failed, retrying...")
            time.sleep(2)
    # Report the real attempt count rather than a hard-coded number.
    print(f"‚õî Detector failed after {retries} attempt(s)")
    return False


# Inline Analyzer
def _violation_count(container, key):
    """Return ``len(container[key])``, or 0 when it is missing or has no length."""
    if not isinstance(container, dict):
        return 0
    try:
        return len(container.get(key, []))
    except TypeError:
        # JSON null (None) or a bare number has no length; count it as empty.
        return 0


def parse_results_inlined(results_dir="Source/Results"):
    """Summarise every ``<results_dir>/<site>/result.json`` into a DataFrame.

    Sub-directories are visited in sorted order so the report is stable
    between runs. A directory without ``result.json``, with a file that is
    not valid UTF-8 JSON, or whose top-level JSON value is not an object is
    reported on stdout and skipped.

    Args:
        results_dir: Directory containing one sub-directory per website.

    Returns:
        A pandas DataFrame with the columns ``Website``, ``ID_Leaking_Count``,
        ``Cookie_Sync_Count``, ``Fingerprinting_Count``, ``Total_Violations``
        and ``Is_Compliant`` (True when the total is zero). The frame is
        empty when no usable result file was found.
    """
    data = []
    website_dirs = sorted(
        d for d in os.listdir(results_dir)
        if os.path.isdir(os.path.join(results_dir, d))
    )
    for site_dir in website_dirs:
        result_path = os.path.join(results_dir, site_dir, "result.json")
        if not os.path.exists(result_path):
            print(f"‚ö†Ô∏è result.json NOT found for {site_dir}, skipping.")
            continue
        try:
            with open(result_path, "r", encoding="utf-8") as f:
                result = json.load(f)
        except (json.JSONDecodeError, UnicodeDecodeError):
            print(f"‚ö†Ô∏è JSON decode error for {site_dir}, skipping.")
            continue
        if not isinstance(result, dict):
            # Without an object there are no keys to count; reporting the
            # site as "0 violations" would be misleading.
            print(f"‚ö†Ô∏è Unexpected JSON structure for {site_dir}, skipping.")
            continue
        # Extract violation counts
        id_leaking_count = _violation_count(result, "idLeaking")
        cookie_sync_count = _violation_count(result, "cookieSync")
        fingerprinting_count = _violation_count(
            result.get("fingerprinting"), "functions"
        )
        total_violations = (
            id_leaking_count + cookie_sync_count + fingerprinting_count
        )
        # Drop only a leading "www_"; removing it anywhere would corrupt
        # names such as "mywww_example_com".
        if site_dir.startswith("www_"):
            name_part = site_dir[len("www_"):]
        else:
            name_part = site_dir
        website_name = name_part.replace("_", ".")
        data.append({
            "Website": website_name,
            "ID_Leaking_Count": id_leaking_count,
            "Cookie_Sync_Count": cookie_sync_count,
            "Fingerprinting_Count": fingerprinting_count,
            "Total_Violations": total_violations,
            "Is_Compliant": total_violations == 0,
        })
    return pd.DataFrame(data)


def main():
    """Crawl and analyse the listed websites, then write a compliance report.

    Steps:
      1. Read the domains from ``ROOT_DOMAIN_COLUMN`` of ``XLSX_PATH`` and
         keep at most ``MAX_WEBSITES`` non-blank entries.
      2. For every domain without an existing ``result.json`` under
         ``RESULTS_PATH``, run the crawler and then the detector; a failure
         in either step skips the domain.
      3. Aggregate all result files with ``parse_results_inlined``, save the
         table to ``Result.xlsx`` and print a summary.
    """
    print("üìÑ Reading Excel file:", XLSX_PATH)
    df = pd.read_excel(XLSX_PATH)
    if ROOT_DOMAIN_COLUMN not in df.columns:
        print(f"‚ùå ERROR: Column '{ROOT_DOMAIN_COLUMN}' not found in Excel!")
        return
    raw_domains = df[ROOT_DOMAIN_COLUMN].dropna().astype(str).tolist()
    # Strip once here so the URL and the folder name are derived from the
    # same text, and drop cells that contain only whitespace.
    domains = [d.strip() for d in raw_domains if d.strip()][:MAX_WEBSITES]
    total_domains = len(domains)
    print(f"üåê Loaded {total_domains} domains (processing first {MAX_WEBSITES}).")
    os.makedirs(RESULTS_PATH, exist_ok=True)
    # Process each website
    for i, domain in enumerate(domains, 1):
        print("\n============================")
        # Use the real number of loaded domains as the denominator; the
        # spreadsheet may hold fewer than MAX_WEBSITES rows.
        print(f"üöÄ Processing website {i}/{total_domains}: {domain}")
        print("============================")
        url = normalize_domain(domain)
        folder_name = domain_to_folder(domain)
        website_result_dir = os.path.join(RESULTS_PATH, folder_name)
        os.makedirs(website_result_dir, exist_ok=True)
        result_json_path = os.path.join(website_result_dir, "result.json")
        if os.path.exists(result_json_path):
            print(f"‚è≠Ô∏è Skipping {domain} (result.json already exists)")
            continue
        # --- Step 1: Crawler with Retry ---
        if not run_crawler_with_retry(url):
            print(f"üö´ Skipping {domain} due to Crawler failure")
            continue
        time.sleep(2)
        # --- Step 2: Detector with Retry ---
        # The detector runs with DETECTOR_PATH as its working directory, so
        # hand it the result folder relative to that directory.
        detector_path = os.path.relpath(website_result_dir, DETECTOR_PATH)
        if not run_detector_with_retry(detector_path):
            print(f"üö´ Skipping {domain} due to Detector failure")
            continue
        time.sleep(1)
    # Final Analysis
    print("\nüìä Running final analysis‚Ä¶\n")
    df_result = parse_results_inlined(RESULTS_PATH)
    if not df_result.empty:
        output_path = "Result.xlsx"
        df_result.to_excel(output_path, index=False)
        print(f"‚úÖ Result saved to: {output_path}")
        print("\n--- Compliance Summary ---")
        print(df_result)
        compliant = df_result["Is_Compliant"].sum()
        total = len(df_result)
        non_compliant = total - compliant
        print(f"\nTotal Sites: {total}")
        print(f"Compliant: {compliant}")
        print(f"Non-Compliant: {non_compliant}")
        # total is non-zero here because the frame is not empty.
        print(f"Non-Compliance Rate: {non_compliant / total * 100:.2f}%")
    else:
        print("‚ö†Ô∏è No valid result.json files found.")
    print("\nüéâ ALL DONE!")


# Run the pipeline only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()

üìÑ Reading Excel file: Top500Website.xlsx
üåê Loaded 400 domains (processing first 400).

üöÄ Processing website 1/400: www.google.com
‚è≠Ô∏è Skipping www.google.com (result.json already exists)

üöÄ Processing website 2/400: www.blogger.com
‚è≠Ô∏è Skipping www.blogger.com (result.json already exists)

üöÄ Processing website 3/400: youtube.com
‚è≠Ô∏è Skipping youtube.com (result.json already exists)

üöÄ Processing website 4/400: linkedin.com
‚è≠Ô∏è Skipping linkedin.com (result.json already exists)

üöÄ Processing website 5/400: support.google.com
‚è≠Ô∏è Skipping support.google.com (result.json already exists)

üöÄ Processing website 6/400: cloudflare.com
‚è≠Ô∏è Skipping cloudflare.com (result.json already exists)

üöÄ Processing website 7/400: microsoft.com
‚è≠Ô∏è Skipping microsoft.com (result.json already exists)

üöÄ Processing website 8/400: apple.com
‚è≠Ô∏è Skipping apple.com (result.json already exists)

üöÄ Processing website 9/400: en.wikipedia.org
‚è≠Ô∏è Skipping

Error at https://bp.blogspot.com:  Error: net::ERR_NAME_NOT_RESOLVED at https://bp.blogspot.com
    at navigate [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:155:23[90m)[39m
[90m    at process.processTicksAndRejections (node:internal/process/task_queues:105:5)[39m
    at async FrameManager.navigateFrame [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:130:21[90m)[39m
    at async Frame.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:500:16[90m)[39m
    at async Page.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Page.js:1167:16[90m)[39m
    at async Scrape [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mdriver/scra

‚õî Crawler failed after 3 attempts
üö´ Skipping bp.blogspot.com due to Crawler failure

üöÄ Processing website 18/400: sites.google.com
‚è≠Ô∏è Skipping sites.google.com (result.json already exists)

üöÄ Processing website 19/400: googleusercontent.com
‚è≠Ô∏è Skipping googleusercontent.com (result.json already exists)

üöÄ Processing website 20/400: accounts.google.com
‚è≠Ô∏è Skipping accounts.google.com (result.json already exists)

üöÄ Processing website 21/400: t.me
‚è≠Ô∏è Skipping t.me (result.json already exists)

üöÄ Processing website 22/400: europa.eu
‚è≠Ô∏è Skipping europa.eu (result.json already exists)

üöÄ Processing website 23/400: plus.google.com
‚è≠Ô∏è Skipping plus.google.com (result.json already exists)

üöÄ Processing website 24/400: whatsapp.com
‚è≠Ô∏è Skipping whatsapp.com (result.json already exists)

üöÄ Processing website 25/400: adobe.com
‚è≠Ô∏è Skipping adobe.com (result.json already exists)

üöÄ Processing website 26/400: facebook.com
‚è≠Ô∏è Skipping

Error at https://uol.com.br:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping uol.com.br due to Crawler failure

üöÄ Processing website 29/400: istockphoto.com
‚è≠Ô∏è Skipping istockphoto.com (result.json already exists)

üöÄ Processing website 30/400: vimeo.com
‚è≠Ô∏è Skipping vimeo.com (result.json already exists)

üöÄ Processing website 31/400: vk.com
‚è≠Ô∏è Skipping vk.com (result.json already exists)

üöÄ Processing website 32/400: github.com
‚è≠Ô∏è Skipping github.com (result.json already exists)

üöÄ Processing website 33/400: amazon.com
‚è≠Ô∏è Skipping amazon.com (result.json already exists)

üöÄ Processing website 34/400: search.google.com
‚è≠Ô∏è Skipping search.google.com (result.json already exists)

üöÄ Processing website 35/400: bbc.co.uk
‚è≠Ô∏è Skipping bbc.co.uk (result.json already exists)

üöÄ Processing website 36/400: google.de
‚è≠Ô∏è Skipping google.de (result.json already exists)

üöÄ Processing website 37/400: live.com
‚è≠Ô

Error at https://jimdofree.com:  ProtocolError: Protocol error (Page.navigate): Target closed.
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Connection.js:226:24
    at new Promise (<anonymous>)
    at CDPSession.send [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Connection.js:222:16[90m)[39m
    at navigate [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:148:47[90m)[39m
    at FrameManager.navigateFrame [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:131:13[90m)[39m
    at Frame.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:500:41[90m)[39m
    at Page.got

‚õî Crawler failed after 3 attempts
üö´ Skipping jimdofree.com due to Crawler failure

üöÄ Processing website 74/400: cpanel.net
‚è≠Ô∏è Skipping cpanel.net (result.json already exists)

üöÄ Processing website 75/400: imdb.com
‚è≠Ô∏è Skipping imdb.com (result.json already exists)

üöÄ Processing website 76/400: wa.me
‚è≠Ô∏è Skipping wa.me (result.json already exists)

üöÄ Processing website 77/400: feedburner.com
‚è≠Ô∏è Skipping feedburner.com (result.json already exists)

üöÄ Processing website 78/400: enable-javascript.com

üîÅ Crawler attempt 1/1 for https://enable-javascript.com
Application Started: [ 11/30/2025, 10:35:23 PM ]

[INFO] Crawling https://enable-javascript.com
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/enable-javascript_com
Application Started: [ 11/30/2025, 10:35:34 PM ]

[INFO] Processing ../Res

Operation failed for ../Results/enable-javascript_com: Error: ENOENT: no such file or directory, open '../Results/enable-javascript_com/cookies.json'
[90m    at Object.readFileSync (node:fs:441:20)[39m
    at LoadData [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mhelpers/storage.js:13:21[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:21:30[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:internal/modules/cjs/loader:1706:14)[39m
[90m    at Object..js (node:internal/modules/cjs/loader:1839:10)[39m
[90m    at Module.load (node:internal/modules/cjs/loader:1441:32)[39m
[90m    at Function._load (


üîÅ Detector attempt 2/3 for ../Results/enable-javascript_com
Application Started: [ 11/30/2025, 10:35:36 PM ]

[INFO] Processing ../Results/enable-javascript_com
‚ùå Detector failed, retrying...


Operation failed for ../Results/enable-javascript_com: Error: ENOENT: no such file or directory, open '../Results/enable-javascript_com/cookies.json'
[90m    at Object.readFileSync (node:fs:441:20)[39m
    at LoadData [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mhelpers/storage.js:13:21[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:21:30[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:internal/modules/cjs/loader:1706:14)[39m
[90m    at Object..js (node:internal/modules/cjs/loader:1839:10)[39m
[90m    at Module.load (node:internal/modules/cjs/loader:1441:32)[39m
[90m    at Function._load (


üîÅ Detector attempt 3/3 for ../Results/enable-javascript_com
Application Started: [ 11/30/2025, 10:35:39 PM ]

[INFO] Processing ../Results/enable-javascript_com
‚ùå Detector failed, retrying...


Operation failed for ../Results/enable-javascript_com: Error: ENOENT: no such file or directory, open '../Results/enable-javascript_com/cookies.json'
[90m    at Object.readFileSync (node:fs:441:20)[39m
    at LoadData [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mhelpers/storage.js:13:21[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:21:30[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:internal/modules/cjs/loader:1706:14)[39m
[90m    at Object..js (node:internal/modules/cjs/loader:1839:10)[39m
[90m    at Module.load (node:internal/modules/cjs/loader:1441:32)[39m
[90m    at Function._load (

‚õî Detector failed after 3 attempts
üö´ Skipping enable-javascript.com due to Detector failure

üöÄ Processing website 79/400: nytimes.com
‚è≠Ô∏è Skipping nytimes.com (result.json already exists)

üöÄ Processing website 80/400: workspace.google.com
‚è≠Ô∏è Skipping workspace.google.com (result.json already exists)

üöÄ Processing website 81/400: ok.ru
‚è≠Ô∏è Skipping ok.ru (result.json already exists)

üöÄ Processing website 82/400: google.es
‚è≠Ô∏è Skipping google.es (result.json already exists)

üöÄ Processing website 83/400: dailymotion.com
‚è≠Ô∏è Skipping dailymotion.com (result.json already exists)

üöÄ Processing website 84/400: afternic.com
‚è≠Ô∏è Skipping afternic.com (result.json already exists)

üöÄ Processing website 85/400: bloomberg.com
‚è≠Ô∏è Skipping bloomberg.com (result.json already exists)

üöÄ Processing website 86/400: amazon.de
‚è≠Ô∏è Skipping amazon.de (result.json already exists)

üöÄ Processing website 87/400: photos.google.com
‚è≠Ô∏è Skipping photos.g

Error at https://indiatimes.com:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping indiatimes.com due to Crawler failure

üöÄ Processing website 91/400: youronlinechoices.com
‚è≠Ô∏è Skipping youronlinechoices.com (result.json already exists)

üöÄ Processing website 92/400: elpais.com
‚è≠Ô∏è Skipping elpais.com (result.json already exists)

üöÄ Processing website 93/400: tinyurl.com
‚è≠Ô∏è Skipping tinyurl.com (result.json already exists)

üöÄ Processing website 94/400: yadi.sk
‚è≠Ô∏è Skipping yadi.sk (result.json already exists)

üöÄ Processing website 95/400: spotify.com
‚è≠Ô∏è Skipping spotify.com (result.json already exists)

üöÄ Processing website 96/400: huffpost.com

üîÅ Crawler attempt 1/1 for https://huffpost.com
Application Started: [ 11/30/2025, 10:36:27 PM ]

[INFO] Crawling https://huffpost.com
[INFO] Created browser instance
[INFO] Visiting website...


Error at https://huffpost.com:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping huffpost.com due to Crawler failure

üöÄ Processing website 97/400: ru.wikipedia.org
‚è≠Ô∏è Skipping ru.wikipedia.org (result.json already exists)

üöÄ Processing website 98/400: google.fr
‚è≠Ô∏è Skipping google.fr (result.json already exists)

üöÄ Processing website 99/400: webmd.com
‚è≠Ô∏è Skipping webmd.com (result.json already exists)

üöÄ Processing website 100/400: samsung.com
‚è≠Ô∏è Skipping samsung.com (result.json already exists)

üöÄ Processing website 101/400: independent.co.uk

üîÅ Crawler attempt 1/1 for https://independent.co.uk
Application Started: [ 11/30/2025, 10:37:13 PM ]

[INFO] Crawling https://independent.co.uk
[INFO] Created browser instance
[INFO] Visiting website...


Error at https://independent.co.uk:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping independent.co.uk due to Crawler failure

üöÄ Processing website 102/400: amazon.co.jp
‚è≠Ô∏è Skipping amazon.co.jp (result.json already exists)

üöÄ Processing website 103/400: get.google.com
‚è≠Ô∏è Skipping get.google.com (result.json already exists)

üöÄ Processing website 104/400: amazon.co.uk
‚è≠Ô∏è Skipping amazon.co.uk (result.json already exists)

üöÄ Processing website 105/400: 4shared.com
‚è≠Ô∏è Skipping 4shared.com (result.json already exists)

üöÄ Processing website 106/400: telegram.me
‚è≠Ô∏è Skipping telegram.me (result.json already exists)

üöÄ Processing website 107/400: planalto.gov.br
‚è≠Ô∏è Skipping planalto.gov.br (result.json already exists)

üöÄ Processing website 108/400: businessinsider.com
‚è≠Ô∏è Skipping businessinsider.com (result.json already exists)

üöÄ Processing website 109/400: ig.com.br
‚è≠Ô∏è Skipping ig.com.br (result.json already exi

Error at https://huffingtonpost.com:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping huffingtonpost.com due to Crawler failure

üöÄ Processing website 120/400: bbc.com
‚è≠Ô∏è Skipping bbc.com (result.json already exists)

üöÄ Processing website 121/400: estadao.com.br
‚è≠Ô∏è Skipping estadao.com.br (result.json already exists)

üöÄ Processing website 122/400: nature.com
‚è≠Ô∏è Skipping nature.com (result.json already exists)

üöÄ Processing website 123/400: mediafire.com
‚è≠Ô∏è Skipping mediafire.com (result.json already exists)

üöÄ Processing website 124/400: washingtonpost.com
‚è≠Ô∏è Skipping washingtonpost.com (result.json already exists)

üöÄ Processing website 125/400: forms.gle
‚è≠Ô∏è Skipping forms.gle (result.json already exists)

üöÄ Processing website 126/400: namecheap.com
‚è≠Ô∏è Skipping namecheap.com (result.json already exists)

üöÄ Processing website 127/400: forbes.com
‚è≠Ô∏è Skipping forbes.com (result.json already exists)

üöÄ Proces

Error at https://marketingplatform.google....:  Error: net::ERR_NAME_NOT_RESOLVED at https://marketingplatform.google....
    at navigate [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:155:23[90m)[39m
[90m    at process.processTicksAndRejections (node:internal/process/task_queues:105:5)[39m
    at async FrameManager.navigateFrame [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:130:21[90m)[39m
    at async Frame.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:500:16[90m)[39m
    at async Page.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Page.js:1167:16[90m)[39m
    at async Scrape [90m(/Users/qie/Desktop/consent-guard-main/Sourc

‚õî Crawler failed after 3 attempts
üö´ Skipping marketingplatform.google.... due to Crawler failure

üöÄ Processing website 132/400: domainmarket.com
‚è≠Ô∏è Skipping domainmarket.com (result.json already exists)

üöÄ Processing website 133/400: ytimg.com

üîÅ Crawler attempt 1/1 for https://ytimg.com
Application Started: [ 11/30/2025, 10:38:50 PM ]

[INFO] Crawling https://ytimg.com
[INFO] Created browser instance
[INFO] Visiting website...
[ERROR] No traces collected
‚ùå Crawler failed, retrying...


Error at https://ytimg.com:  Error: net::ERR_NAME_NOT_RESOLVED at https://ytimg.com
    at navigate [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:155:23[90m)[39m
[90m    at process.processTicksAndRejections (node:internal/process/task_queues:105:5)[39m
    at async FrameManager.navigateFrame [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:130:21[90m)[39m
    at async Frame.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:500:16[90m)[39m
    at async Page.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Page.js:1167:16[90m)[39m
    at async Scrape [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mdriver/scrape.js:40:5[

‚õî Crawler failed after 3 attempts
üö´ Skipping ytimg.com due to Crawler failure

üöÄ Processing website 134/400: terra.com.br
‚è≠Ô∏è Skipping terra.com.br (result.json already exists)

üöÄ Processing website 135/400: google.co.uk
‚è≠Ô∏è Skipping google.co.uk (result.json already exists)

üöÄ Processing website 136/400: shutterstock.com
‚è≠Ô∏è Skipping shutterstock.com (result.json already exists)

üöÄ Processing website 137/400: dailymail.co.uk
‚è≠Ô∏è Skipping dailymail.co.uk (result.json already exists)

üöÄ Processing website 138/400: reg.ru
‚è≠Ô∏è Skipping reg.ru (result.json already exists)

üöÄ Processing website 139/400: t.co
‚è≠Ô∏è Skipping t.co (result.json already exists)

üöÄ Processing website 140/400: cdc.gov
‚è≠Ô∏è Skipping cdc.gov (result.json already exists)

üöÄ Processing website 141/400: thesun.co.uk

üîÅ Crawler attempt 1/1 for https://thesun.co.uk
Application Started: [ 11/30/2025, 10:38:53 PM ]

[INFO] Crawling https://thesun.co.uk
[INFO] Created browse

Error at https://list-manage.com:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111
    at async FrameManager.navigateFrame [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:130:21[90m)[39m
    at async Frame.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:500:16[90m)[39m
    at async Page.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Page.js:1167:16[90m)[39m
    at async Scrape [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mdriver/scrape.js:40:5[90m)[39m
    at async CollectTraces [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mapp

[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping list-manage.com due to Crawler failure

üöÄ Processing website 150/400: msn.com
‚è≠Ô∏è Skipping msn.com (result.json already exists)

üöÄ Processing website 151/400: un.org
‚è≠Ô∏è Skipping un.org (result.json already exists)

üöÄ Processing website 152/400: de.wikipedia.org
‚è≠Ô∏è Skipping de.wikipedia.org (result.json already exists)

üöÄ Processing website 153/400: ovh.com
‚è≠Ô∏è Skipping ovh.com (result.json already exists)

üöÄ Processing website 154/400: mail.ru
‚è≠Ô∏è Skipping mail.ru (result.json already exists)

üöÄ Processing website 155/400: bing.com
‚è≠Ô∏è Skipping bing.com (result.json already exists)

üöÄ Processing website 156/400: news.yahoo.com

üîÅ Crawler attempt 1/1 for https://news.yahoo.com
Application Started: [ 11/30/2025, 10:40:02 PM ]

[INFO] Crawling https://news.yahoo.com
[INFO] Created browser instance
[INFO] Visiting website...


Error at https://news.yahoo.com:  Error: Navigation failed because browser has disconnected!
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:51:147
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/vendor/mitt/src/index.js:51:62
    at Array.map (<anonymous>)
    at Object.emit [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/vendor/mitt/src/index.js:51:43[90m)[39m
    at CDPSession.emit [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/EventEmitter.js:72:22[90m)[39m
    at CDPSession._onClosed [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Connection.js:267:14[90m)[39m
    at Connection._onClose [90m(/Users/qie/Desktop/consen

[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping news.yahoo.com due to Crawler failure

üöÄ Processing website 157/400: myaccount.google.com
‚è≠Ô∏è Skipping myaccount.google.com (result.json already exists)

üöÄ Processing website 158/400: hatena.ne.jp
‚è≠Ô∏è Skipping hatena.ne.jp (result.json already exists)

üöÄ Processing website 159/400: shopify.com
‚è≠Ô∏è Skipping shopify.com (result.json already exists)

üöÄ Processing website 160/400: adssettings.google.com
‚è≠Ô∏è Skipping adssettings.google.com (result.json already exists)

üöÄ Processing website 161/400: bit.ly
‚è≠Ô∏è Skipping bit.ly (result.json already exists)

üöÄ Processing website 162/400: reuters.com
‚è≠Ô∏è Skipping reuters.com (result.json already exists)

üöÄ Processing website 163/400: booking.com
‚è≠Ô∏è Skipping booking.com (result.json already exists)

üöÄ Processing website 164/400: discord.com
‚è≠Ô∏è Skipping discord.com (result.json already exis

Operation failed for ../Results/nasa_gov: AssertionError [ERR_ASSERTION]: The expression evaluated to a falsy value:

  assert(Cookies.IsCookieValid(cookie))

    at [90m/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:206:9
    at Array.forEach (<anonymous>)
    at CookieLeak [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:205:13[90m)[39m
    at IdLeaking [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:228:12[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:37:25[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:inter


üîÅ Detector attempt 2/3 for ../Results/nasa_gov
Application Started: [ 11/30/2025, 10:40:31 PM ]

[INFO] Processing ../Results/nasa_gov
[INFO] Loaded data
‚ùå Detector failed, retrying...


Operation failed for ../Results/nasa_gov: AssertionError [ERR_ASSERTION]: The expression evaluated to a falsy value:

  assert(Cookies.IsCookieValid(cookie))

    at [90m/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:206:9
    at Array.forEach (<anonymous>)
    at CookieLeak [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:205:13[90m)[39m
    at IdLeaking [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:228:12[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:37:25[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:inter


üîÅ Detector attempt 3/3 for ../Results/nasa_gov
Application Started: [ 11/30/2025, 10:40:33 PM ]

[INFO] Processing ../Results/nasa_gov
[INFO] Loaded data
‚ùå Detector failed, retrying...


Operation failed for ../Results/nasa_gov: AssertionError [ERR_ASSERTION]: The expression evaluated to a falsy value:

  assert(Cookies.IsCookieValid(cookie))

    at [90m/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:206:9
    at Array.forEach (<anonymous>)
    at CookieLeak [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:205:13[90m)[39m
    at IdLeaking [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:228:12[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:37:25[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:inter

‚õî Detector failed after 3 attempts
üö´ Skipping nasa.gov due to Detector failure

üöÄ Processing website 167/400: aboutads.info
‚è≠Ô∏è Skipping aboutads.info (result.json already exists)

üöÄ Processing website 168/400: time.com
‚è≠Ô∏è Skipping time.com (result.json already exists)

üöÄ Processing website 169/400: abril.com.br

üîÅ Crawler attempt 1/1 for https://abril.com.br
Application Started: [ 11/30/2025, 10:40:35 PM ]

[INFO] Crawling https://abril.com.br
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/abril_com_br
Application Started: [ 11/30/2025, 10:40:48 PM ]

[INFO] Processing ../Results/abril_com_br
[INFO] Loaded data
‚ùå Detector failed, retrying...


Operation failed for ../Results/abril_com_br: AssertionError [ERR_ASSERTION]: The expression evaluated to a falsy value:

  assert(Cookies.IsCookieValid(cookie))

    at [90m/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:206:9
    at Array.forEach (<anonymous>)
    at CookieLeak [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:205:13[90m)[39m
    at IdLeaking [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:228:12[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:37:25[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:i


üîÅ Detector attempt 2/3 for ../Results/abril_com_br
Application Started: [ 11/30/2025, 10:40:50 PM ]

[INFO] Processing ../Results/abril_com_br
[INFO] Loaded data
‚ùå Detector failed, retrying...


Operation failed for ../Results/abril_com_br: AssertionError [ERR_ASSERTION]: The expression evaluated to a falsy value:

  assert(Cookies.IsCookieValid(cookie))

    at [90m/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:206:9
    at Array.forEach (<anonymous>)
    at CookieLeak [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:205:13[90m)[39m
    at IdLeaking [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:228:12[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:37:25[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:i


üîÅ Detector attempt 3/3 for ../Results/abril_com_br
Application Started: [ 11/30/2025, 10:40:52 PM ]

[INFO] Processing ../Results/abril_com_br
[INFO] Loaded data
‚ùå Detector failed, retrying...


Operation failed for ../Results/abril_com_br: AssertionError [ERR_ASSERTION]: The expression evaluated to a falsy value:

  assert(Cookies.IsCookieValid(cookie))

    at [90m/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:206:9
    at Array.forEach (<anonymous>)
    at CookieLeak [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:205:13[90m)[39m
    at IdLeaking [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mdetectors/leaks.js:228:12[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:37:25[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:i

‚õî Detector failed after 3 attempts
üö´ Skipping abril.com.br due to Detector failure

üöÄ Processing website 170/400: change.org
‚è≠Ô∏è Skipping change.org (result.json already exists)

üöÄ Processing website 171/400: nginx.org
‚è≠Ô∏è Skipping nginx.org (result.json already exists)

üöÄ Processing website 172/400: twitter.com
‚è≠Ô∏è Skipping twitter.com (result.json already exists)

üöÄ Processing website 173/400: www.wikipedia.org
‚è≠Ô∏è Skipping www.wikipedia.org (result.json already exists)

üöÄ Processing website 174/400: archive.org
‚è≠Ô∏è Skipping archive.org (result.json already exists)

üöÄ Processing website 175/400: cbsnews.com
‚è≠Ô∏è Skipping cbsnews.com (result.json already exists)

üöÄ Processing website 176/400: networkadvertising.org
‚è≠Ô∏è Skipping networkadvertising.org (result.json already exists)

üöÄ Processing website 177/400: telegraph.co.uk
‚è≠Ô∏è Skipping telegraph.co.uk (result.json already exists)

üöÄ Processing website 178/400: pinterest.com
‚è≠Ô

Error at https://windows.net:  Error: net::ERR_CERT_COMMON_NAME_INVALID at https://windows.net
    at navigate [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:155:23[90m)[39m
[90m    at process.processTicksAndRejections (node:internal/process/task_queues:105:5)[39m
    at async FrameManager.navigateFrame [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:130:21[90m)[39m
    at async Frame.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:500:16[90m)[39m
    at async Page.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Page.js:1167:16[90m)[39m
    at async Scrape [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mdriver/scrap

[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping windows.net due to Crawler failure

üöÄ Processing website 186/400: alicdn.com

üîÅ Crawler attempt 1/1 for https://alicdn.com
Application Started: [ 11/30/2025, 10:40:58 PM ]

[INFO] Crawling https://alicdn.com
[INFO] Created browser instance
[INFO] Visiting website...


Error at https://alicdn.com:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111
    at async FrameManager.navigateFrame [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:130:21[90m)[39m
    at async Frame.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:500:16[90m)[39m
    at async Page.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Page.js:1167:16[90m)[39m
    at async Scrape [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mdriver/scrape.js:40:5[90m)[39m
    at async CollectTraces [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mapp.js:3

[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping alicdn.com due to Crawler failure

üöÄ Processing website 187/400: google.ca
‚è≠Ô∏è Skipping google.ca (result.json already exists)

üöÄ Processing website 188/400: lemonde.fr
‚è≠Ô∏è Skipping lemonde.fr (result.json already exists)

üöÄ Processing website 189/400: newyorker.com
‚è≠Ô∏è Skipping newyorker.com (result.json already exists)

üöÄ Processing website 190/400: webnode.page
‚è≠Ô∏è Skipping webnode.page (result.json already exists)

üöÄ Processing website 191/400: surveymonkey.com
‚è≠Ô∏è Skipping surveymonkey.com (result.json already exists)

üöÄ Processing website 192/400: translate.google.com
‚è≠Ô∏è Skipping translate.google.com (result.json already exists)

üöÄ Processing website 193/400: calendar.google.com
‚è≠Ô∏è Skipping calendar.google.com (result.json already exists)

üöÄ Processing website 194/400: amazonaws.com

üîÅ Crawler attempt 1/1 for https://amazo

Error at https://amazonaws.com:  Error: net::ERR_CONNECTION_REFUSED at https://amazonaws.com
    at navigate [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:155:23[90m)[39m
[90m    at process.processTicksAndRejections (node:internal/process/task_queues:105:5)[39m
    at async FrameManager.navigateFrame [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:130:21[90m)[39m
    at async Frame.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:500:16[90m)[39m
    at async Page.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Page.js:1167:16[90m)[39m
    at async Scrape [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mdriver/scrape.

[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping amazonaws.com due to Crawler failure

üöÄ Processing website 195/400: academia.edu
‚è≠Ô∏è Skipping academia.edu (result.json already exists)

üöÄ Processing website 196/400: apache.org
‚è≠Ô∏è Skipping apache.org (result.json already exists)

üöÄ Processing website 197/400: imageshack.us
‚è≠Ô∏è Skipping imageshack.us (result.json already exists)

üöÄ Processing website 198/400: akamaihd.net

üîÅ Crawler attempt 1/1 for https://akamaihd.net
Application Started: [ 11/30/2025, 10:41:48 PM ]

[INFO] Crawling https://akamaihd.net
[INFO] Created browser instance
[INFO] Visiting website...


Error at https://akamaihd.net:  Error: net::ERR_NAME_NOT_RESOLVED at https://akamaihd.net
    at navigate [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:155:23[90m)[39m
[90m    at process.processTicksAndRejections (node:internal/process/task_queues:105:5)[39m
    at async FrameManager.navigateFrame [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:130:21[90m)[39m
    at async Frame.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:500:16[90m)[39m
    at async Page.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Page.js:1167:16[90m)[39m
    at async Scrape [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mdriver/scrape.js:

[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping akamaihd.net due to Crawler failure

üöÄ Processing website 199/400: nginx.com
‚è≠Ô∏è Skipping nginx.com (result.json already exists)

üöÄ Processing website 200/400: discord.gg
‚è≠Ô∏è Skipping discord.gg (result.json already exists)

üöÄ Processing website 201/400: thetimes.co.uk
‚è≠Ô∏è Skipping thetimes.co.uk (result.json already exists)

üöÄ Processing website 202/400: search.yahoo.com

üîÅ Crawler attempt 1/1 for https://search.yahoo.com
Application Started: [ 11/30/2025, 10:41:51 PM ]

[INFO] Crawling https://search.yahoo.com
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/search_yahoo_com
Application Started: [ 11/30/2025, 10:42:01 PM ]

[INFO] Processing ../Results/search_yahoo_com
[INFO] Loaded data
[INF

Error at https://ggpht.com:  Error: net::ERR_NAME_NOT_RESOLVED at https://ggpht.com
    at navigate [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:155:23[90m)[39m
[90m    at process.processTicksAndRejections (node:internal/process/task_queues:105:5)[39m
    at async FrameManager.navigateFrame [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:130:21[90m)[39m
    at async Frame.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:500:16[90m)[39m
    at async Page.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Page.js:1167:16[90m)[39m
    at async Scrape [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mdriver/scrape.js:40:5[

[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping ggpht.com due to Crawler failure

üöÄ Processing website 211/400: privacyshield.gov

üîÅ Crawler attempt 1/1 for https://privacyshield.gov
Application Started: [ 11/30/2025, 10:42:05 PM ]

[INFO] Crawling https://privacyshield.gov
[INFO] Created browser instance
[INFO] Visiting website...


Error at https://privacyshield.gov:  Error: net::ERR_CONNECTION_RESET at https://privacyshield.gov
    at navigate [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:155:23[90m)[39m
[90m    at process.processTicksAndRejections (node:internal/process/task_queues:105:5)[39m
    at async FrameManager.navigateFrame [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:130:21[90m)[39m
    at async Frame.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:500:16[90m)[39m
    at async Page.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Page.js:1167:16[90m)[39m
    at async Scrape [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mdriver/s

[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping privacyshield.gov due to Crawler failure

üöÄ Processing website 212/400: www.over-blog.com

üîÅ Crawler attempt 1/1 for https://www.over-blog.com
Application Started: [ 11/30/2025, 10:42:09 PM ]

[INFO] Crawling https://www.over-blog.com
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[ERROR] No traces collected
‚ùå Crawler failed, retrying...


Error at https://www.over-blog.com:  Error: Protocol error (Network.getCookies): Session closed. Most likely the page has been closed.
    at CDPSession.send [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Connection.js:214:35[90m)[39m
    at Page.cookies [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Page.js:733:53[90m)[39m
    at Object.GetFirstPartyCookies [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mscrapers/cookies.js:26:23[90m)[39m
    at Scrape [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mdriver/scrape.js:45:46[90m)[39m
    at async CollectTraces [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mapp.js:32:24[90m)[39m
    at async main [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mapp.js:83:24[90m)[39m


‚õî Crawler failed after 3 attempts
üö´ Skipping www.over-blog.com due to Crawler failure

üöÄ Processing website 213/400: clarin.com

üîÅ Crawler attempt 1/1 for https://clarin.com
Application Started: [ 11/30/2025, 10:42:21 PM ]

[INFO] Crawling https://clarin.com
[INFO] Created browser instance
[INFO] Visiting website...


Error at https://clarin.com:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping clarin.com due to Crawler failure

üöÄ Processing website 214/400: www.wix.com
‚è≠Ô∏è Skipping www.wix.com (result.json already exists)

üöÄ Processing website 215/400: whitehouse.gov
‚è≠Ô∏è Skipping whitehouse.gov (result.json already exists)

üöÄ Processing website 216/400: icann.org
‚è≠Ô∏è Skipping icann.org (result.json already exists)

üöÄ Processing website 217/400: gnu.org
‚è≠Ô∏è Skipping gnu.org (result.json already exists)

üöÄ Processing website 218/400: yandex.ru
‚è≠Ô∏è Skipping yandex.ru (result.json already exists)

üöÄ Processing website 219/400: francetvinfo.fr

üîÅ Crawler attempt 1/1 for https://francetvinfo.fr
Application Started: [ 11/30/2025, 10:43:05 PM ]

[INFO] Crawling https://francetvinfo.fr
[INFO] Created browser instance
[INFO] Visiting website...


Error at https://francetvinfo.fr:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping francetvinfo.fr due to Crawler failure

üöÄ Processing website 220/400: gmail.com
‚è≠Ô∏è Skipping gmail.com (result.json already exists)

üöÄ Processing website 221/400: mozilla.com
‚è≠Ô∏è Skipping mozilla.com (result.json already exists)

üöÄ Processing website 222/400: ziddu.com
‚è≠Ô∏è Skipping ziddu.com (result.json already exists)

üöÄ Processing website 223/400: guardian.co.uk
‚è≠Ô∏è Skipping guardian.co.uk (result.json already exists)

üöÄ Processing website 224/400: twitch.tv
‚è≠Ô∏è Skipping twitch.tv (result.json already exists)

üöÄ Processing website 225/400: sedo.com
‚è≠Ô∏è Skipping sedo.com (result.json already exists)

üöÄ Processing website 226/400: foxnews.com
‚è≠Ô∏è Skipping foxnews.com (result.json already exists)

üöÄ Processing website 227/400: rambler.ru
‚è≠Ô∏è Skipping rambler.ru (result.json already exists)

üöÄ Processing website 228/400: books.g

Error at https://sfgate.com:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping sfgate.com due to Crawler failure

üöÄ Processing website 234/400: liveinternet.ru

üîÅ Crawler attempt 1/1 for https://liveinternet.ru
Application Started: [ 11/30/2025, 10:44:36 PM ]

[INFO] Crawling https://liveinternet.ru
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/liveinternet_ru
Application Started: [ 11/30/2025, 10:44:58 PM ]

[INFO] Processing ../Results/liveinternet_ru
[INFO] Loaded data
[INFO] Detected [33m0[39m first-party ID leaking violations
[INFO] Detected [33m108[39m third-party ID synchronization violations
[INFO] Detected [33m0[39m browser fingerprinting functions
[INFO] Found network traffic towards [33m235[39m third-parties
[INFO] Processed website
[INFO] Stored data to ../Results/li

Error at https://nypost.com:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping nypost.com due to Crawler failure

üöÄ Processing website 256/400: elmundo.es

üîÅ Crawler attempt 1/1 for https://elmundo.es
Application Started: [ 11/30/2025, 10:46:51 PM ]

[INFO] Crawling https://elmundo.es
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/elmundo_es
Application Started: [ 11/30/2025, 10:47:10 PM ]

[INFO] Processing ../Results/elmundo_es
[INFO] Loaded data
[INFO] Detected [33m11[39m first-party ID leaking violations
[INFO] Detected [33m0[39m third-party ID synchronization violations
[INFO] Detected [33m0[39m browser fingerprinting functions
[INFO] Found network traffic towards [33m80[39m third-parties
[INFO] Processed website
[INFO] Stored data to ../Results/elmundo_es/result.json
‚úÖ De

Error at https://ipv4.google.com:  Error: Navigation failed because browser has disconnected!
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:51:147
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/vendor/mitt/src/index.js:51:62
    at Array.map (<anonymous>)
    at Object.emit [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/vendor/mitt/src/index.js:51:43[90m)[39m
    at CDPSession.emit [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/EventEmitter.js:72:22[90m)[39m
    at CDPSession._onClosed [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Connection.js:267:14[90m)[39m
    at Connection._onClose [90m(/Users/qie/Desktop/conse

[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping ipv4.google.com due to Crawler failure

üöÄ Processing website 259/400: deezer.com

üîÅ Crawler attempt 1/1 for https://deezer.com
Application Started: [ 11/30/2025, 10:47:35 PM ]

[INFO] Crawling https://deezer.com
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/deezer_com
Application Started: [ 11/30/2025, 10:47:47 PM ]

[INFO] Processing ../Results/deezer_com
[INFO] Loaded data
[INFO] Detected [33m0[39m first-party ID leaking violations
[INFO] Detected [33m0[39m third-party ID synchronization violations
[INFO] Detected [33m0[39m browser fingerprinting functions
[INFO] Found network traffic towards [33m7[39m third-parties
[INFO] Processed website
[INFO] Stored data to ../Results/deezer_com/result.json
‚úÖ

Operation failed for ../Results/t-online_de: Error: ENOENT: no such file or directory, open '../Results/t-online_de/cookies.json'
[90m    at Object.readFileSync (node:fs:441:20)[39m
    at LoadData [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mhelpers/storage.js:13:21[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:21:30[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:internal/modules/cjs/loader:1706:14)[39m
[90m    at Object..js (node:internal/modules/cjs/loader:1839:10)[39m
[90m    at Module.load (node:internal/modules/cjs/loader:1441:32)[39m
[90m    at Function._load (node:internal/module


üîÅ Detector attempt 2/3 for ../Results/t-online_de
Application Started: [ 11/30/2025, 10:50:07 PM ]

[INFO] Processing ../Results/t-online_de
‚ùå Detector failed, retrying...


Operation failed for ../Results/t-online_de: Error: ENOENT: no such file or directory, open '../Results/t-online_de/cookies.json'
[90m    at Object.readFileSync (node:fs:441:20)[39m
    at LoadData [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mhelpers/storage.js:13:21[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:21:30[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:internal/modules/cjs/loader:1706:14)[39m
[90m    at Object..js (node:internal/modules/cjs/loader:1839:10)[39m
[90m    at Module.load (node:internal/modules/cjs/loader:1441:32)[39m
[90m    at Function._load (node:internal/module


üîÅ Detector attempt 3/3 for ../Results/t-online_de
Application Started: [ 11/30/2025, 10:50:09 PM ]

[INFO] Processing ../Results/t-online_de
‚ùå Detector failed, retrying...


Operation failed for ../Results/t-online_de: Error: ENOENT: no such file or directory, open '../Results/t-online_de/cookies.json'
[90m    at Object.readFileSync (node:fs:441:20)[39m
    at LoadData [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mhelpers/storage.js:13:21[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:21:30[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:internal/modules/cjs/loader:1706:14)[39m
[90m    at Object..js (node:internal/modules/cjs/loader:1839:10)[39m
[90m    at Module.load (node:internal/modules/cjs/loader:1441:32)[39m
[90m    at Function._load (node:internal/module

‚õî Detector failed after 3 attempts
üö´ Skipping t-online.de due to Detector failure

üöÄ Processing website 270/400: telegra.ph

üîÅ Crawler attempt 1/1 for https://telegra.ph
Application Started: [ 11/30/2025, 10:50:11 PM ]

[INFO] Crawling https://telegra.ph
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/telegra_ph
Application Started: [ 11/30/2025, 10:50:20 PM ]

[INFO] Processing ../Results/telegra_ph
[INFO] Loaded data
[INFO] Detected [33m0[39m first-party ID leaking violations
[INFO] Detected [33m0[39m third-party ID synchronization violations
[INFO] Detected [33m0[39m browser fingerprinting functions
[INFO] Found network traffic towards [33m3[39m third-parties
[INFO] Processed website
[INFO] Stored data to ../Results/telegra_ph/result.json
‚úÖ Detector success

üöÄ Processing website 271/400: mega.nz



Error at https://usnews.com:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping usnews.com due to Crawler failure

üöÄ Processing website 273/400: plos.org

üîÅ Crawler attempt 1/1 for https://plos.org
Application Started: [ 11/30/2025, 10:51:20 PM ]

[INFO] Crawling https://plos.org
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/plos_org
Application Started: [ 11/30/2025, 10:51:35 PM ]

[INFO] Processing ../Results/plos_org
[INFO] Loaded data
[INFO] Detected [33m3[39m first-party ID leaking violations
[INFO] Detected [33m0[39m third-party ID synchronization violations
[INFO] Detected [33m0[39m browser fingerprinting functions
[INFO] Found network traffic towards [33m21[39m third-parties
[INFO] Processed website
[INFO] Stored data to ../Results/plos_org/result.json
‚úÖ Detector succes

Error at https://lefigaro.fr:  ProtocolError: Protocol error (Target.attachToTarget): Target closed.
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Connection.js:75:24
    at new Promise (<anonymous>)
    at Connection.send [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Connection.js:71:16[90m)[39m
    at Connection.createSession [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Connection.js:157:42[90m)[39m
    at Target._sessionFactory [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Browser.js:192:91[90m)[39m
    at Target.page [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Target.js:73:38[90m)[39m
    at [90m

‚õî Crawler failed after 3 attempts
üö´ Skipping lefigaro.fr due to Crawler failure

üöÄ Processing website 280/400: bp1.blogger.com

üîÅ Crawler attempt 1/1 for https://bp1.blogger.com
Application Started: [ 11/30/2025, 10:52:52 PM ]

[INFO] Crawling https://bp1.blogger.com
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/bp1_blogger_com
Application Started: [ 11/30/2025, 10:53:02 PM ]

[INFO] Processing ../Results/bp1_blogger_com
[INFO] Loaded data
[INFO] Detected [33m0[39m first-party ID leaking violations
[INFO] Detected [33m0[39m third-party ID synchronization violations
[INFO] Detected [33m0[39m browser fingerprinting functions
[INFO] Found network traffic towards [33m2[39m third-parties
[INFO] Processed website
[INFO] Stored data to ../Results/bp1_blogger_com/result.json
‚úÖ Detector success

üöÄ Processing

Error at https://nydailynews.com:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping nydailynews.com due to Crawler failure

üöÄ Processing website 284/400: themeforest.net

üîÅ Crawler attempt 1/1 for https://themeforest.net
Application Started: [ 11/30/2025, 10:54:14 PM ]

[INFO] Crawling https://themeforest.net
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/themeforest_net
Application Started: [ 11/30/2025, 10:54:25 PM ]

[INFO] Processing ../Results/themeforest_net
[INFO] Loaded data
[INFO] Detected [33m0[39m first-party ID leaking violations
[INFO] Detected [33m0[39m third-party ID synchronization violations
[INFO] Detected [33m0[39m browser fingerprinting functions
[INFO] Found network traffic towards [33m5[39m third-parties
[INFO] Processed website
[INFO] Stored data to ../Results/t

Error at https://rtve.es:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping rtve.es due to Crawler failure

üöÄ Processing website 286/400: newsweek.com

üîÅ Crawler attempt 1/1 for https://newsweek.com
Application Started: [ 11/30/2025, 10:55:10 PM ]

[INFO] Crawling https://newsweek.com
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/newsweek_com
Application Started: [ 11/30/2025, 10:55:22 PM ]

[INFO] Processing ../Results/newsweek_com
[INFO] Loaded data
[INFO] Detected [33m15[39m first-party ID leaking violations
[INFO] Detected [33m26[39m third-party ID synchronization violations
[INFO] Detected [33m0[39m browser fingerprinting functions
[INFO] Found network traffic towards [33m201[39m third-parties
[INFO] Processed website
[INFO] Stored data to ../Results/newsweek_com/result.

Error at https://ca.gov:  ProtocolError: Protocol error (Page.navigate): Target closed.
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Connection.js:226:24
    at new Promise (<anonymous>)
    at CDPSession.send [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/Connection.js:222:16[90m)[39m
    at navigate [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:148:47[90m)[39m
    at FrameManager.navigateFrame [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:131:13[90m)[39m
    at Frame.goto [90m(/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/FrameManager.js:500:41[90m)[39m
    at Page.goto [90m

[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping ca.gov due to Crawler failure

üöÄ Processing website 289/400: goodreads.com

üîÅ Crawler attempt 1/1 for https://goodreads.com
Application Started: [ 11/30/2025, 10:55:42 PM ]

[INFO] Crawling https://goodreads.com
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/goodreads_com
Application Started: [ 11/30/2025, 10:55:54 PM ]

[INFO] Processing ../Results/goodreads_com
[INFO] Loaded data
[INFO] Detected [33m1[39m first-party ID leaking violations
[INFO] Detected [33m1[39m third-party ID synchronization violations
[INFO] Detected [33m0[39m browser fingerprinting functions
[INFO] Found network traffic towards [33m29[39m third-parties
[INFO] Processed website
[INFO] Stored data to ../Results/goodreads_com/resul

Error at https://hindustantimes.com:  TimeoutError: Navigation timeout of 40000 ms exceeded
    at [90m/Users/qie/Desktop/consent-guard-main/Source/Crawler/[39mnode_modules/[4mpuppeteer[24m/lib/cjs/puppeteer/common/LifecycleWatcher.js:106:111


[ERROR] No traces collected
‚ùå Crawler failed, retrying...
‚õî Crawler failed after 3 attempts
üö´ Skipping hindustantimes.com due to Crawler failure

üöÄ Processing website 295/400: weibo.com

üîÅ Crawler attempt 1/1 for https://weibo.com
Application Started: [ 11/30/2025, 10:57:54 PM ]

[INFO] Crawling https://weibo.com
[INFO] Created browser instance
[INFO] Visiting website...
[INFO] Waiting...
[INFO] Collecting data...
[INFO] Storing data...
[INFO] Process complete
‚úÖ Crawler success

üîÅ Detector attempt 1/3 for ../Results/weibo_com
Application Started: [ 11/30/2025, 10:58:06 PM ]

[INFO] Processing ../Results/weibo_com
[INFO] Loaded data
[INFO] Detected [33m0[39m first-party ID leaking violations
[INFO] Detected [33m0[39m third-party ID synchronization violations
[INFO] Detected [33m0[39m browser fingerprinting functions
[INFO] Found network traffic towards [33m3[39m third-parties
[INFO] Processed website
[INFO] Stored data to ../Results/weibo_com/result.json
‚úÖ De

Operation failed for ../Results/e-monsite_com: Error: ENOENT: no such file or directory, open '../Results/e-monsite_com/cookies.json'
[90m    at Object.readFileSync (node:fs:441:20)[39m
    at LoadData [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mhelpers/storage.js:13:21[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:21:30[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:internal/modules/cjs/loader:1706:14)[39m
[90m    at Object..js (node:internal/modules/cjs/loader:1839:10)[39m
[90m    at Module.load (node:internal/modules/cjs/loader:1441:32)[39m
[90m    at Function._load (node:internal/mo


üîÅ Detector attempt 2/3 for ../Results/e-monsite_com
Application Started: [ 11/30/2025, 10:58:59 PM ]

[INFO] Processing ../Results/e-monsite_com
‚ùå Detector failed, retrying...


Operation failed for ../Results/e-monsite_com: Error: ENOENT: no such file or directory, open '../Results/e-monsite_com/cookies.json'
[90m    at Object.readFileSync (node:fs:441:20)[39m
    at LoadData [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mhelpers/storage.js:13:21[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:21:30[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:internal/modules/cjs/loader:1706:14)[39m
[90m    at Object..js (node:internal/modules/cjs/loader:1839:10)[39m
[90m    at Module.load (node:internal/modules/cjs/loader:1441:32)[39m
[90m    at Function._load (node:internal/mo


üîÅ Detector attempt 3/3 for ../Results/e-monsite_com
Application Started: [ 11/30/2025, 10:59:01 PM ]

[INFO] Processing ../Results/e-monsite_com
‚ùå Detector failed, retrying...


Operation failed for ../Results/e-monsite_com: Error: ENOENT: no such file or directory, open '../Results/e-monsite_com/cookies.json'
[90m    at Object.readFileSync (node:fs:441:20)[39m
    at LoadData [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mhelpers/storage.js:13:21[90m)[39m
    at Analyse [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:21:30[90m)[39m
    at ProcessWebsite [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:83:24[90m)[39m
    at main [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:121:28[90m)[39m
    at Object.<anonymous> [90m(/Users/qie/Desktop/consent-guard-main/Source/Detector/[39mapp.js:142:3[90m)[39m
[90m    at Module._compile (node:internal/modules/cjs/loader:1706:14)[39m
[90m    at Object..js (node:internal/modules/cjs/loader:1839:10)[39m
[90m    at Module.load (node:internal/modules/cjs/loader:1441:32)[39m
[90m    at Function._load (node:internal/mo

‚õî Detector failed after 3 attempts
üö´ Skipping e-monsite.com due to Detector failure

üöÄ Processing website 299/400: hubspot.com

üîÅ Crawler attempt 1/1 for https://hubspot.com
Application Started: [ 11/30/2025, 10:59:03 PM ]

[INFO] Crawling https://hubspot.com
[INFO] Created browser instance
[INFO] Visiting website...


KeyboardInterrupt: 