In [1]:
import requests
from bs4 import BeautifulSoup
from fake_useragent import UserAgent
import time

class SearchAgent:
    def __init__(self, country):
        self.country = country
        self.job_titles = [
            "CTO", "CEO", "Talent Acquisition", "HR Manager"
        ]
        self.industries = [
            "Generative AI", "Artificial Intelligence", "Machine Learning", "Software Companies"
        ]

    def get_profiles(self):
        headers = {"User-Agent": UserAgent().random}
        profiles = []

        for title in self.job_titles:
            for industry in self.industries:
                search_query = f"{title} {industry} {self.country} site:linkedin.com/in/"
                google_search_url = f"https://www.google.com/search?q={search_query}&num=20"

                response = requests.get(google_search_url, headers=headers)
                time.sleep(2)  # Avoid getting blocked

                if response.status_code == 200:
                    soup = BeautifulSoup(response.text, "html.parser")
                    for link in soup.find_all("a", href=True):
                        href = link["href"]
                        if "linkedin.com/in/" in href:
                            profile_link = href.split("&")[0].replace("/url?q=", "")
                            profiles.append(profile_link)

        return list(set(profiles))  # Remove duplicates


In [2]:
import re

class FilterAgent:
    def __init__(self, profiles):
        self.profiles = profiles

    def clean_profiles(self):
        unique_profiles = list(set(self.profiles))  # Remove duplicates
        return [profile for profile in unique_profiles if re.search(r"linkedin\.com/in/", profile)]


In [14]:
import autogen

# Initialize agents to search for AI industry leaders
search_agent = SearchAgent("USA")
profiles = search_agent.get_ctos()  # Get profiles (only LinkedIn URLs)

filter_agent = FilterAgent(profiles)
cleaned_profiles = filter_agent.clean_profiles()  # Clean & remove duplicates

# Print LinkedIn profile links
print("\n[✅] Extracted LinkedIn Profiles:")
for profile in cleaned_profiles:
    print(profile)



[✅] Extracted LinkedIn Profiles:
/search?q=CTO+USA+site:linkedin.com/in/


In [17]:
# Initialize agents
search_agent = SearchAgent("USA")
profiles = search_agent.get_profiles()  # Get LinkedIn profile links

# Print the results
print("\n[✅] Extracted LinkedIn Profiles:")
for profile in profiles:
    print(profile)



[✅] Extracted LinkedIn Profiles:
/search?q=CEO+Machine+Learning+USA+site:linkedin.com/in/
/search?q=CTO+Generative+AI+USA+site:linkedin.com/in/
/search?q=HR+Manager+Generative+AI+USA+site:linkedin.com/in/
/search?q=HR+Manager+Artificial+Intelligence+USA+site:linkedin.com/in/
/search?q=CTO+Artificial+Intelligence+USA+site:linkedin.com/in/
/search?q=CTO+Machine+Learning+USA+site:linkedin.com/in/
/search?q=Talent+Acquisition+Generative+AI+USA+site:linkedin.com/in/
/search?q=CEO+Artificial+Intelligence+USA+site:linkedin.com/in/
/search?q=Talent+Acquisition+Artificial+Intelligence+USA+site:linkedin.com/in/
/search?q=CEO+Generative+AI+USA+site:linkedin.com/in/
/search?q=HR+Manager+Software+Companies+USA+site:linkedin.com/in/
/search?q=CTO+Software+Companies+USA+site:linkedin.com/in/
/search?q=HR+Manager+Machine+Learning+USA+site:linkedin.com/in/
/search?q=CEO+Software+Companies+USA+site:linkedin.com/in/
/search?q=Talent+Acquisition+Machine+Learning+USA+site:linkedin.com/in/
/search?q=Talent

In [19]:
import requests
from bs4 import BeautifulSoup
from fake_useragent import UserAgent
import pandas as pd
import time

class SearchAgent:
    def __init__(self, country):
        self.country = country
        self.job_titles = ["CTO", "CEO", "Talent Acquisition", "HR Manager"]
        self.industries = ["Generative AI", "Artificial Intelligence", "Machine Learning", "Software Companies"]
        self.search_engine_url = "https://www.bing.com/search?q="  # Use Bing instead of Google

    def get_profiles(self):
        headers = {"User-Agent": UserAgent().random}
        profiles = []

        for title in self.job_titles:
            for industry in self.industries:
                search_query = f"{title} {industry} {self.country} site:linkedin.com/in/"
                response = requests.get(f"{self.search_engine_url}{search_query}&count=50", headers=headers)
                time.sleep(3)  # Avoid getting blocked

                if response.status_code == 200:
                    soup = BeautifulSoup(response.text, "html.parser")
                    for link in soup.find_all("a", href=True):
                        href = link["href"]
                        if "linkedin.com/in/" in href:
                            profiles.append(href)  # Direct LinkedIn profile link

        return list(set(profiles))  # Remove duplicates

    def save_to_csv(self, profiles, filename="linkedin_profiles.csv"):
        df = pd.DataFrame(profiles, columns=["LinkedIn Profile"])
        df.to_csv(filename, index=False)
        print(f"[✅] Profiles saved to {filename}")


In [20]:
# Initialize search for AI industry leaders
search_agent = SearchAgent("USA")
profiles = search_agent.get_profiles()  # Get multiple LinkedIn profile links

# Print results
print("\n[✅] Extracted LinkedIn Profiles:")
for profile in profiles:
    print(profile)

# Save to CSV for later use
search_agent.save_to_csv(profiles)


[✅] Extracted LinkedIn Profiles:
https://www.linkedin.com/in/anthony-melatti-8284a46b
https://www.linkedin.com/in/harrison-m-8990721b8
https://www.linkedin.com/in/satya-shah
https://www.linkedin.com/in/zhengping-ji-494649b
https://www.linkedin.com/in/ashishgandotra
https://www.linkedin.com/in/rohit-tiwari-907387204
https://www.linkedin.com/in/tahak
https://www.linkedin.com/in/vijay0
https://www.linkedin.com/in/sameersingh
https://www.linkedin.com/in/davidtalby
https://www.linkedin.com/in/andrew-fausak-a43631
https://www.linkedin.com/in/gmlander
https://www.linkedin.com/in/james-tooles
https://www.linkedin.com/in/jim-miller-mba-bb2ab43
https://www.linkedin.com/in/jeremystanley
https://www.linkedin.com/in/phillip-middleton-b69b2825
https://www.linkedin.com/in/anis-hamdi-872067181
https://www.linkedin.com/in/julia-filiberti-allen
https://www.linkedin.com/in/ztoa
https://www.linkedin.com/in/mateizaharia
[✅] Profiles saved to linkedin_profiles.csv
