In [1]:
import pandas as pd
import numpy as np
import re
import ast
import os 
from dotenv import load_dotenv

# Load environment variables from the .env file
load_dotenv()
ANTHROPIC_API_KEY = os.getenv('ANTHROPIC_API_KEY')

# Set Pandas options to display full text for all columns
pd.set_option('display.max_colwidth', None)
pd.set_option('display.max_columns', None)  # Show all columns


In [2]:
# Load the dataset from the './data' folder
people_path = './data/YC F24 Founder People.csv'

# Read data into pandas DataFrame
people_data = pd.read_csv(people_path)

# Relevant columns to keep
relevant_columns = [
    'full_name', 'title', 'location', 'company', 'company_linkedin', 
    'company_description', 'sub_title', 'summary', 'current_job_description', 
    'person_industry', 'skills', 'education', 'work_history'
]

# Filter the relevant columns
people_filtered = people_data[relevant_columns]

# Display basic information about the dataset
print("Dataset Loaded:")
display(people_filtered.head())


Dataset Loaded:


Unnamed: 0,full_name,title,location,company,company_linkedin,company_description,sub_title,summary,current_job_description,person_industry,skills,education,work_history
0,Edward Aryee,Co-Founder & CTO,"San Francisco Bay, San Francisco Bay Area, United States of America",SRE.ai (YC F24),https://www.linkedin.com/company/104394435/,,Co-Founder & CTO at SRE.ai (YC F24) | ex-Google,,An AI-powered automation platform for Salesforce development teams.,Software Development,"[""Programming"", ""Python"", ""Java"", ""JavaScript"", ""Matlab"", ""Computer Science"", ""Public Speaking""]","[{""date"":{""start"":{""month"":null,""year"":null,""day"":null},""end"":{""month"":null,""year"":null,""day"":null}},""school"":{""name"":""Drexel University"",""logo"":""https://media.licdn.com/dms/image/v2/C510BAQEqp_nXWmHi6Q/company-logo_400_400/company-logo_400_400/0/1631320003902?e=1740614400&v=beta&t=V5sjIC9C8zYonL2o9_NBkJWzeRu-9_XNIFQKCWmgGzE"",""url"":""https://www.linkedin.com/company/5164/""},""degree_name"":""B.S. Computer Science"",""field_of_study"":""B.S. Computer Science"",""description"":null}]","[{""company"":{""id"":104394435,""name"":""SRE.ai (YC F24)"",""logo"":""https://media.licdn.com/dms/image/v2/D560BAQFgYyZbiA64pw/company-logo_400_400/company-logo_400_400/0/1731048003973/sreai_logo?e=1740614400&v=beta&t=2SPj0iQU8dTrHco4EIqUSqF6wYn5IxQfx66et9B2e7w"",""url"":""https://www.linkedin.com/company/104394435/""},""date"":{""start"":{""month"":10,""year"":2024,""day"":null},""end"":{""year"":null,""month"":null,""day"":null}},""profile_positions"":[{""location"":""San Francisco, California, United States"",""date"":{""start"":{""month"":10,""year"":2024,""day"":null},""end"":{""year"":null,""month"":null,""day"":null}},""company"":""SRE.ai (YC F24)"",""description"":""An AI-powered automation platform for Salesforce development teams."",""title"":""Co-Founder & CTO"",""employment_type"":""Full-time""}]},{""company"":{""id"":86046410,""name"":""Black Angel Group (BAG)"",""logo"":""https://media.licdn.com/dms/image/v2/D560BAQGlQJ3RvtjVPg/company-logo_400_400/company-logo_400_400/0/1686966482606?e=1740614400&v=beta&t=ucPVKqQPwAhklwXiaeUq3ey4WS95PeEupNtwdQkz6n4"",""url"":""https://www.linkedin.com/company/86046410/""},""date"":{""start"":{""month"":12,""year"":2022,""day"":null},""end"":{""year"":null,""month"":null,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":12,""year"":2022,""day"":null},""end"":{""year"":null,""month"":null,""day"":null}},""company"":""Black Angel Group (BAG)"",""description"":""Investing intellectual, social and financial capital in seed to Series A startups around the world. Our collective believes in founders who build ethical, high-growth technology companies."",""title"":""Angel Investor"",""employment_type"":null}]},{""company"":{""id"":1441,""name"":""Google"",""logo"":""https://media.licdn.com/dms/image/v2/C4D0BAQHiNSL4Or29cg/company-logo_400_400/company-logo_400_400/0/1631311446380?e=1740614400&v=beta&t=mjYwrMVLDtBnx1lXZ5L-t56YLcXTQWE_ER5LG9AvP5w"",""url"":""https://www.linkedin.com/company/1441/""},""date"":{""start"":{""month"":7,""year"":2018,""day"":null},""end"":{""month"":9,""year"":2024,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":1,""year"":2022,""day"":null},""end"":{""month"":9,""year"":2024,""day"":null}},""company"":""Google"",""description"":"""",""title"":""Senior Software Engineer and Tech Lead, Search (Translate) "",""employment_type"":null},{""location"":null,""date"":{""start"":{""month"":6,""year"":2023,""day"":null},""end"":{""month"":6,""year"":2024,""day"":null}},""company"":""Google"",""description"":"""",""title"":""Startup & VC Engagement Lead, Bay Area"",""employment_type"":null},{""location"":null,""date"":{""start"":{""month"":1,""year"":2023,""day"":null},""end"":{""month"":6,""year"":2023,""day"":null}},""company"":""Google"",""description"":"""",""title"":""Startup & VC Engagement Manager"",""employment_type"":null},{""location"":null,""date"":{""start"":{""month"":1,""year"":2020,""day"":null},""end"":{""month"":1,""year"":2022,""day"":null}},""company"":""Google"",""description"":"""",""title"":""Senior Software Engineer, Research "",""employment_type"":null},{""location"":null,""date"":{""start"":{""month"":7,""year"":2018,""day"":null},""end"":{""month"":1,""year"":2020,""day"":null}},""company"":""Google"",""description"":"""",""title"":""Software Engineer"",""employment_type"":null}]},{""company"":{""id"":1035,""name"":""Microsoft"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQE88xCsONDULQ/company-logo_400_400/company-logo_400_400/0/1630652622688/microsoft_logo?e=1740614400&v=beta&t=qmRiI_WPTCUwX9L1YFf-TgzP0iUVb9I3_eMlESIlcFQ"",""url"":""https://www.linkedin.com/company/1035/""},""date"":{""start"":{""month"":6,""year"":2017,""day"":null},""end"":{""month"":3,""year"":2018,""day"":null}},""profile_positions"":[{""location"":""Cambridge, Massachusetts"",""date"":{""start"":{""month"":6,""year"":2017,""day"":null},""end"":{""month"":3,""year"":2018,""day"":null}},""company"":""Microsoft"",""description"":""Developed and launched Ink to Code, an AI solution for transferring rapid sketches with Surface Ink Pen into real code for cross-platform apps. Created with a team of only interns, from initial idea to production in one summer."",""title"":""Software Engineer"",""employment_type"":null}]},{""company"":{""id"":3632554,""name"":""StratIS IoT"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQEmtd8bqBk4ug/company-logo_400_400/company-logo_400_400/0/1654196616542/stratis_iot_logo?e=1740614400&v=beta&t=j5-rG1DxGQa0C4pmXU1g5HQLxLyfsnVlmd4U8RCdQaE"",""url"":""https://www.linkedin.com/company/3632554/""},""date"":{""start"":{""month"":3,""year"":2017,""day"":null},""end"":{""month"":5,""year"":2017,""day"":null}},""profile_positions"":[{""location"":""Philadelphia, Pennsylvania"",""date"":{""start"":{""month"":3,""year"":2017,""day"":null},""end"":{""month"":5,""year"":2017,""day"":null}},""company"":""StratIS IoT"",""description"":""STRATIS® was later acquired by RealPage. Built the first integration with Schlage wireless Smart Lock technology in V1 of the Stratis App. Built maintenance request submission and ticketing system for multifamily and student housing building management."",""title"":""Software Engineer"",""employment_type"":null}]},{""company"":{""id"":2477895,""name"":""Web Presence in China"",""logo"":""https://media.licdn.com/dms/image/v2/C4E0BAQGo35F92R-1dg/company-logo_400_400/company-logo_400_400/0/1630595140642/wpic_logo?e=1740614400&v=beta&t=IjtZ_OZakWByAgP2LiliZS1RfYqHlYthU_5Tjb4GCPs"",""url"":""https://www.linkedin.com/company/2477895/""},""date"":{""start"":{""month"":4,""year"":2016,""day"":null},""end"":{""month"":9,""year"":2016,""day"":null}},""profile_positions"":[{""location"":""Beijing, China"",""date"":{""start"":{""month"":4,""year"":2016,""day"":null},""end"":{""month"":9,""year"":2016,""day"":null}},""company"":""Web Presence in China"",""description"":""Developed utilities responsible for access and analysis of website content used by Fortune 200 companies. Published an open-source module for testing, translating, and publishing MithrilJS components"",""title"":""Software Engineering Co-op"",""employment_type"":null}]},{""company"":{""id"":726936,""name"":""BuLogics"",""logo"":""https://media.licdn.com/dms/image/v2/C4D0BAQEUYsZQrbbLGw/company-logo_400_400/company-logo_400_400/0/1631312147393?e=1740614400&v=beta&t=ZxQBqPn33euYz5nxtWD8ogQ89nEKPBg_tE39Iwjx7Xg"",""url"":""https://www.linkedin.com/company/726936/""},""date"":{""start"":{""month"":4,""year"":2015,""day"":null},""end"":{""month"":11,""year"":2015,""day"":null}},""profile_positions"":[{""location"":""Philadelphia, Pennsylvania"",""date"":{""start"":{""month"":4,""year"":2015,""day"":null},""end"":{""month"":11,""year"":2015,""day"":null}},""company"":""BuLogics"",""description"":""Entirely recreated the Vigzul home security mobile application, transferring it from native iOS to cross-platform, improving efficiency and usability."",""title"":""Cross Platform Developer Co-op"",""employment_type"":null}]},{""company"":{""id"":null,""name"":""Virtual Pantry"",""logo"":null,""url"":""https://www.linkedin.com/search/results/all/?keywords=Virtual+Pantry""},""date"":{""start"":{""month"":3,""year"":2014,""day"":null},""end"":{""month"":1,""year"":2015,""day"":null}},""profile_positions"":[{""location"":""Philadelphia, Pennsylvania, United States"",""date"":{""start"":{""month"":3,""year"":2014,""day"":null},""end"":{""month"":1,""year"":2015,""day"":null}},""company"":""Virtual Pantry"",""description"":""Co-founder of Virtual Pantry, a mobile application digitizing parts of the cooking prep experience. Backed by Drexel University Close School of Entrepreneurship.\n\nMaintain a list of ingredients in your kitchen and easily search for recipes with filters for allergies and dietary needs. One-click grocery list creation based on what you have and what you want to cook!"",""title"":""Co-Founder, Software Engineer"",""employment_type"":""Self-employed""}]},{""company"":{""id"":2624,""name"":""Columbia University"",""logo"":""https://media.licdn.com/dms/image/v2/C4E0BAQFxn78nvVaTDA/company-logo_400_400/company-logo_400_400/0/1630638452046/columbia_university_logo?e=1740614400&v=beta&t=kSxBiUJsV3sCkq-Y1-plsWjjoqj3anUIQoqQcz6Gd3Q"",""url"":""https://www.linkedin.com/company/2624/""},""date"":{""start"":{""month"":5,""year"":2011,""day"":null},""end"":{""month"":5,""year"":2013,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":5,""year"":2011,""day"":null},""end"":{""month"":5,""year"":2013,""day"":null}},""company"":""Columbia University"",""description"":""Research assistant under Dr. Kartik Chandran of Columbia University"",""title"":""Research Intern"",""employment_type"":null}]}]"
1,Victor Cheng,Co-Founder and CEO,"San Francisco, California, United States of America",vly.ai (YC F24),https://www.linkedin.com/company/99356232/,,co-founder @ vly.ai (YC F24),cooking,The easiest way to build custom full-stack software without code. Backed by Y Combinator,Software Development,"[""Startups"", ""TypeScript"", ""Git"", ""Express.js"", ""MongoDB"", ""Full-Stack Development"", ""Node.js"", ""Competitive Programming"", ""Next.js"", ""Software Development"", ""React.js"", ""C++"", ""JavaScript"", ""C#"", ""Java"", ""Unity3D"", ""Business"", ""Mathematics"", ""Robotics"", ""Mobile Application Development"", ""Android Studio""]","[{""date"":{""start"":{""month"":9,""year"":2022,""day"":null},""end"":{""month"":null,""year"":null,""day"":null}},""school"":{""name"":""University of Washington"",""logo"":""https://media.licdn.com/dms/image/v2/C4D0BAQEMmhF9TqUCgA/company-logo_400_400/company-logo_400_400/0/1630545704089/university_of_washington_logo?e=1740614400&v=beta&t=aasGmKsnzSlETq4R656LLVoSHB4_KTl7DY8kqkH55iQ"",""url"":""https://www.linkedin.com/company/2584/""},""degree_name"":""Bachelor of Science - BS, Computer Science & Entrepreneurship"",""field_of_study"":""Bachelor of Science - BS, Computer Science & Entrepreneurship"",""description"":""Dubhacks Next Startup Incubator Program, Entrepreneur in Residence\nHusky Running Club Elected Technology Officer\nLavin Entrepreneurship Program""},{""date"":{""start"":{""month"":1,""year"":2018,""day"":null},""end"":{""month"":1,""year"":2022,""day"":null}},""school"":{""name"":""Skyline High School"",""logo"":""https://media.licdn.com/dms/image/v2/C4E0BAQH-8yO5gkDCzQ/company-logo_400_400/company-logo_400_400/0/1630582324933?e=1740614400&v=beta&t=vsELTy4vlYBa18qbgmxVyIfSrN4vPoVYm5gnVpcUnNc"",""url"":""https://www.linkedin.com/company/34217292/""},""degree_name"":""High School Diploma, IB Diploma"",""field_of_study"":""High School Diploma, IB Diploma"",""description"":""IB Diploma | 4.0 Unweighted GPA | 36 ACT\nSkyline Robotics Software Lead\nVarsity Cross Country\nVarsity Mock Trial\n3-time AIME Qualifier\nUSACO Gold\nEagle Scout""},{""date"":{""start"":{""month"":9,""year"":2024,""day"":null},""end"":{""month"":null,""year"":null,""day"":null}},""school"":{""name"":""Y Combinator"",""logo"":""https://media.licdn.com/dms/image/v2/C4D0BAQGPzdBPNxrmEg/company-logo_400_400/company-logo_400_400/0/1673555093250/y_combinator_logo?e=1740614400&v=beta&t=IkWVzeoerUDjMi0gmzWEkNZvM23worfLYr1CjmAOWCM"",""url"":""https://www.linkedin.com/company/167872/""},""degree_name"":""F24"",""field_of_study"":""F24"",""description"":""vly.ai (YC F24)""}]","[{""company"":{""id"":99356232,""name"":""vly.ai (YC F24)"",""logo"":""https://media.licdn.com/dms/image/v2/D560BAQHSBsQNp4nbiQ/company-logo_400_400/company-logo_400_400/0/1730702869448/vly_ai_logo?e=1740614400&v=beta&t=EV2ju4ZhTCXTzq5hFsQlnBagrECrd86dnvS0yUFWVwA"",""url"":""https://www.linkedin.com/company/99356232/""},""date"":{""start"":{""month"":5,""year"":2024,""day"":null},""end"":{""year"":null,""month"":null,""day"":null}},""profile_positions"":[{""location"":""San Francisco Bay Area"",""date"":{""start"":{""month"":5,""year"":2024,""day"":null},""end"":{""year"":null,""month"":null,""day"":null}},""company"":""vly.ai (YC F24)"",""description"":""The easiest way to build custom full-stack software without code. Backed by Y Combinator"",""title"":""Co-Founder and CEO"",""employment_type"":null}]},{""company"":{""id"":10356344,""name"":""Hatch Coding"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQHUY2Ltzhuemw/company-logo_400_400/company-logo_400_400/0/1630669969906/hatchcoding_logo?e=1740614400&v=beta&t=cUNFqfU1RMl7CkCbxqgNELXZET25IrwMtr9XtiWA_6E"",""url"":""https://www.linkedin.com/company/10356344/""},""date"":{""start"":{""month"":10,""year"":2023,""day"":null},""end"":{""month"":5,""year"":2024,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":10,""year"":2023,""day"":null},""end"":{""month"":5,""year"":2024,""day"":null}},""company"":""Hatch Coding"",""description"":""Creating the next generation of educational software in the field of AI to gamify learning and make it enjoyable for all. Hoping to pave the way to new careers for students through a better way to learn."",""title"":""Software Engineer"",""employment_type"":""Part-time""}]},{""company"":{""id"":90635835,""name"":""Minute Land"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQFNT2A9KjMDbA/company-logo_400_400/company-logo_400_400/0/1678435140369?e=1740614400&v=beta&t=170cT5qh4w5FZRjbtQADH8Ak-k_KA0uolkm2RrcR82U"",""url"":""https://www.linkedin.com/company/90635835/""},""date"":{""start"":{""month"":11,""year"":2022,""day"":null},""end"":{""month"":4,""year"":2024,""day"":null}},""profile_positions"":[{""location"":""Seattle, Washington, United States"",""date"":{""start"":{""month"":11,""year"":2022,""day"":null},""end"":{""month"":4,""year"":2024,""day"":null}},""company"":""Minute Land"",""description"":""Created the technology behind Minute Land (https://minute.land), an off-grid land marketplace that makes the dream of land ownership affordable through subdivided plots starting as low as $100."",""title"":""Founding Engineer"",""employment_type"":""Part-time""}]},{""company"":{""id"":91376357,""name"":""Quantum Labs"",""logo"":""https://media.licdn.com/dms/image/v2/D560BAQFj1AKTPkTlWA/company-logo_400_400/company-logo_400_400/0/1695510001779/quantum_labs_nonprofit_logo?e=1740614400&v=beta&t=X1Wz3HtKSG4lWdTkAJPaAQE0avkUUeiqdJ1612GeCZE"",""url"":""https://www.linkedin.com/company/91376357/""},""date"":{""start"":{""month"":4,""year"":2023,""day"":null},""end"":{""month"":10,""year"":2023,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":4,""year"":2023,""day"":null},""end"":{""month"":10,""year"":2023,""day"":null}},""company"":""Quantum Labs"",""description"":""Acquired in October 2023 by Hatch Coding. An EdTech Startup focused on making AI learning fun and enjoyable for students."",""title"":""Founder"",""employment_type"":null}]},{""company"":{""id"":1879,""name"":""Autodesk"",""logo"":""https://media.licdn.com/dms/image/v2/D560BAQGrSi2UOCdL5g/company-logo_400_400/company-logo_400_400/0/1719952472030/autodesk_logo?e=1740614400&v=beta&t=oMbikFCSfM2uZ4lxQB6P3dcqF3IpfhSzMS9H_HKIbeg"",""url"":""https://www.linkedin.com/company/1879/""},""date"":{""start"":{""month"":6,""year"":2021,""day"":null},""end"":{""month"":9,""year"":2022,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":6,""year"":2021,""day"":null},""end"":{""month"":9,""year"":2022,""day"":null}},""company"":""Autodesk"",""description"":""Software Engineer for the Autodesk Synthesis Engine Team. Worked directly on a 3D robotics simulation platform."",""title"":""Software Engineer"",""employment_type"":""Internship""}]},{""company"":{""id"":64869164,""name"":""FRC Team 2976, Spartabots"",""logo"":""https://media.licdn.com/dms/image/v2/C4E0BAQEKkulRRFq1IQ/company-logo_400_400/company-logo_400_400/0/1630589404426?e=1740614400&v=beta&t=YEaOZQdBPkyDMzZVS6YORSrrqrYaRuWUV_9fnHDKt4U"",""url"":""https://www.linkedin.com/company/64869164/""},""date"":{""start"":{""month"":6,""year"":2021,""day"":null},""end"":{""month"":6,""year"":2022,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":6,""year"":2021,""day"":null},""end"":{""month"":6,""year"":2022,""day"":null}},""company"":""FRC Team 2976, Spartabots"",""description"":""In charge of the programming sector for FRC Team 2976. Multiple world championship titles."",""title"":""Software Lead"",""employment_type"":""Seasonal""}]},{""company"":{""id"":null,""name"":""Self-employed"",""logo"":null,""url"":""https://www.linkedin.com/search/results/all/?keywords=Self-employed""},""date"":{""start"":{""month"":7,""year"":2018,""day"":null},""end"":{""month"":5,""year"":2022,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":2,""year"":2018,""day"":null},""end"":{""month"":5,""year"":2022,""day"":null}},""company"":""Self-employed"",""description"":""Programmed dozens of in-depth and complex apps and games with thousands of downloads on iOS and Android. Managed all aspects of marketing, business, growth, and development."",""title"":""App & Game Developer"",""employment_type"":null},{""location"":""Sammamish, Washington, United States"",""date"":{""start"":{""month"":7,""year"":2018,""day"":null},""end"":{""month"":9,""year"":2020,""day"":null}},""company"":""Self-employed"",""description"":""I created multiple small-businesses and entrepreneurial ventures in the field of retail. Four-figure exit."",""title"":""Business Manager"",""employment_type"":null}]}]"
2,Daryl Budiman,Co-Founder & CEO,"San Francisco Bay, San Francisco Bay Area, United States of America",Andoria (YC F24),https://www.linkedin.com/company/102953213/,,Co-Founder at Andoria (YC F24) | Prev. MultiOn & Stanford,Imagine if you didn't have to learn any piece of software anymore.,"Backed by YC, among other great investors.","Technology, Information and Internet","[""Customer Onboarding"", ""Customer Success"", ""SwiftUI"", ""C++"", ""React.js"", ""Microsoft PowerPoint"", ""HTML"", ""CSS"", ""JavaScript"", ""Python"", ""Presentation Skills"", ""Public Speaking"", ""Adobe Photoshop"", ""Research"", ""ArcGIS"", ""Figma"", ""Leadership"", ""User Interface Design"", ""Computer-Aided Design (CAD)"", ""Autodesk Fusion 360""]","[{""date"":{""start"":{""month"":null,""year"":null,""day"":null},""end"":{""month"":null,""year"":null,""day"":null}},""school"":{""name"":""Stanford University"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQHr9suxyJBXMw/company-logo_400_400/company-logo_400_400/0/1635534378870/stanford_university_logo?e=1740614400&v=beta&t=jUvD393txVFjXC99hgAnTaWMx1lc2T_PEvkxHShNG5E"",""url"":""https://www.linkedin.com/company/1792/""},""degree_name"":""Bachelor of Science - BS, Symbolic Systems"",""field_of_study"":""Bachelor of Science - BS, Symbolic Systems"",""description"":null},{""date"":{""start"":{""month"":null,""year"":null,""day"":null},""end"":{""month"":null,""year"":null,""day"":null}},""school"":{""name"":""Y Combinator"",""logo"":""https://media.licdn.com/dms/image/v2/C4D0BAQGPzdBPNxrmEg/company-logo_400_400/company-logo_400_400/0/1673555093250/y_combinator_logo?e=1740614400&v=beta&t=IkWVzeoerUDjMi0gmzWEkNZvM23worfLYr1CjmAOWCM"",""url"":""https://www.linkedin.com/company/167872/""},""degree_name"":""F24"",""field_of_study"":""F24"",""description"":null}]","[{""company"":{""id"":102953213,""name"":""Andoria (YC F24)"",""logo"":""https://media.licdn.com/dms/image/v2/D560BAQGynXFMqzMzjQ/company-logo_400_400/company-logo_400_400/0/1730097880527/andoriaai_logo?e=1740614400&v=beta&t=j7A_jaCfQ3QRUx8Q2S90d-DS0KBKHkkWtx6FhVycEpg"",""url"":""https://www.linkedin.com/company/102953213/""},""date"":{""start"":{""month"":1,""year"":2024,""day"":null},""end"":{""year"":null,""month"":null,""day"":null}},""profile_positions"":[{""location"":""San Francisco Bay Area"",""date"":{""start"":{""month"":1,""year"":2024,""day"":null},""end"":{""year"":null,""month"":null,""day"":null}},""company"":""Andoria (YC F24)"",""description"":""Backed by YC, among other great investors."",""title"":""Co-Founder & CEO"",""employment_type"":null}]},{""company"":{""id"":95719778,""name"":""MultiOn"",""logo"":""https://media.licdn.com/dms/image/v2/D4E0BAQEy938dZY3oRQ/company-logo_400_400/company-logo_400_400/0/1702667475712/multionai_logo?e=1740614400&v=beta&t=KaJ7wt00-kT3jqbNQjxVEVy-RVtrwN0Ql_k3V8Fg9s4"",""url"":""https://www.linkedin.com/company/95719778/""},""date"":{""start"":{""month"":1,""year"":2023,""day"":null},""end"":{""month"":1,""year"":2024,""day"":null}},""profile_positions"":[{""location"":""Palo Alto, California, United States"",""date"":{""start"":{""month"":1,""year"":2023,""day"":null},""end"":{""month"":1,""year"":2024,""day"":null}},""company"":""MultiOn"",""description"":""AI web agents. Backed by General Catalyst, Amazon, Samsung, and more."",""title"":""Founding Designer"",""employment_type"":null}]},{""company"":{""id"":1586,""name"":""Amazon"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQHTvZwCx4p2Qg/company-logo_400_400/company-logo_400_400/0/1630640869849/amazon_logo?e=1740614400&v=beta&t=gbBBG91ElkMyDZw3x00xrkgmJf3OJ59EXPV5IDymhLc"",""url"":""https://www.linkedin.com/company/1586/""},""date"":{""start"":{""month"":1,""year"":2023,""day"":null},""end"":{""month"":1,""year"":2023,""day"":null}},""profile_positions"":[{""location"":""Seattle, Washington, United States"",""date"":{""start"":{""month"":1,""year"":2023,""day"":null},""end"":{""month"":1,""year"":2023,""day"":null}},""company"":""Amazon"",""description"":"""",""title"":""Design"",""employment_type"":null}]},{""company"":{""id"":35534053,""name"":""The Marriage Pact"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQF415KCAJh1Gw/company-logo_400_400/company-logo_400_400/0/1630650815060/marriage_pact_logo?e=1740614400&v=beta&t=2ZacZG027yTeJrpjOAccjGzhVJJPaKR8HHXB-f6Kf84"",""url"":""https://www.linkedin.com/company/35534053/""},""date"":{""start"":{""month"":1,""year"":2022,""day"":null},""end"":{""month"":1,""year"":2023,""day"":null}},""profile_positions"":[{""location"":""San Francisco Bay Area"",""date"":{""start"":{""month"":1,""year"":2022,""day"":null},""end"":{""month"":1,""year"":2023,""day"":null}},""company"":""The Marriage Pact"",""description"":"""",""title"":""PM"",""employment_type"":null}]},{""company"":{""id"":62953,""name"":""Evernote"",""logo"":""https://media.licdn.com/dms/image/v2/C4D0BAQGfbcKw53FGDQ/company-logo_400_400/company-logo_400_400/0/1630510668469/evernote_logo?e=1740614400&v=beta&t=S9a0A_vz6kt_mgV0UDtw_b56Gy2ZKu1ySKNmp7j4VFQ"",""url"":""https://www.linkedin.com/company/62953/""},""date"":{""start"":{""month"":1,""year"":2022,""day"":null},""end"":{""month"":1,""year"":2022,""day"":null}},""profile_positions"":[{""location"":""New York, United States"",""date"":{""start"":{""month"":1,""year"":2022,""day"":null},""end"":{""month"":1,""year"":2022,""day"":null}},""company"":""Evernote"",""description"":"""",""title"":""Design"",""employment_type"":null}]},{""company"":{""id"":34581506,""name"":""Matcha"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQFC0TTrEVrBog/company-logo_400_400/company-logo_400_400/0/1673858027862?e=1740614400&v=beta&t=e_jQdR3olNYChELVmP2b3g2zbZ4FZn6IcOROYWSNju0"",""url"":""https://www.linkedin.com/company/34581506/""},""date"":{""start"":{""month"":1,""year"":2021,""day"":null},""end"":{""month"":1,""year"":2022,""day"":null}},""profile_positions"":[{""location"":""New York, United States"",""date"":{""start"":{""month"":1,""year"":2021,""day"":null},""end"":{""month"":1,""year"":2022,""day"":null}},""company"":""Matcha"",""description"":"""",""title"":""Design Engineer"",""employment_type"":null}]},{""company"":{""id"":1790,""name"":""Stanford University School of Medicine"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQH74V3iDB5G5Q/company-logo_400_400/company-logo_400_400/0/1630632331199/stanford_university_school_of_medicine_logo?e=1740614400&v=beta&t=juxwnyJQrjswWSI4ZSbjvvInZt7yU7zhs246xC-_SA4"",""url"":""https://www.linkedin.com/company/1790/""},""date"":{""start"":{""month"":1,""year"":2021,""day"":null},""end"":{""month"":1,""year"":2021,""day"":null}},""profile_positions"":[{""location"":""Stanford, California, United States"",""date"":{""start"":{""month"":1,""year"":2021,""day"":null},""end"":{""month"":1,""year"":2021,""day"":null}},""company"":""Stanford University School of Medicine"",""description"":"""",""title"":""Research Assistant"",""employment_type"":null}]}]"
3,Finn Mallery,Co-Founder,"Palo Alto, California, United States of America",Origami Agents (YC F24),https://www.linkedin.com/company/99440945/,,Co-Founder @ Origami Agents (YC F24),,,"Technology, Information and Internet",[],"[{""date"":{""start"":{""month"":null,""year"":null,""day"":null},""end"":{""month"":null,""year"":null,""day"":null}},""school"":{""name"":""Stanford University"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQHr9suxyJBXMw/company-logo_400_400/company-logo_400_400/0/1635534378870/stanford_university_logo?e=1740614400&v=beta&t=jUvD393txVFjXC99hgAnTaWMx1lc2T_PEvkxHShNG5E"",""url"":""https://www.linkedin.com/company/1792/""},""degree_name"":""Bachelor of Science with Honors, Mathematics and Computational Science"",""field_of_study"":""Bachelor of Science with Honors, Mathematics and Computational Science"",""description"":null},{""date"":{""start"":{""month"":null,""year"":null,""day"":null},""end"":{""month"":null,""year"":null,""day"":null}},""school"":{""name"":""Stanford University School of Engineering"",""logo"":""https://media.licdn.com/dms/image/v2/C4E0BAQGBk9nVkNx7og/company-logo_400_400/company-logo_400_400/0/1631342355719?e=1740614400&v=beta&t=Gmvct7a8l1SCVxDqhBTbj508hCfMs6vMLneUk6yKy-I"",""url"":""https://www.linkedin.com/company/16266013/""},""degree_name"":""Master of Science - MS"",""field_of_study"":""Master of Science - MS"",""description"":""On leave""},{""date"":{""start"":{""month"":null,""year"":null,""day"":null},""end"":{""month"":null,""year"":null,""day"":null}},""school"":{""name"":""Z Fellows"",""logo"":""https://media.licdn.com/dms/image/v2/D4D0BAQGxt8rf67zIHw/company-logo_400_400/company-logo_400_400/0/1690772534719/zfellows_logo?e=1740614400&v=beta&t=XscUMNZUkq2mnznNg3N55Q9FO0epBUQrcGW0AVcBuys"",""url"":""https://www.linkedin.com/company/80045987/""},""degree_name"":"""",""field_of_study"":"""",""description"":null},{""date"":{""start"":{""month"":1,""year"":2017,""day"":null},""end"":{""month"":1,""year"":2020,""day"":null}},""school"":{""name"":""Canyon Crest Academy"",""logo"":""https://media.licdn.com/dms/image/v2/C4D0BAQHs8qvIIPHh-w/company-logo_400_400/company-logo_400_400/0/1631315915043?e=1740614400&v=beta&t=_DLcoGNX9zG2iKrM9MZhXOa6upKCxhCaKipWr0B1T1I"",""url"":""https://www.linkedin.com/company/360890/""},""degree_name"":"""",""field_of_study"":"""",""description"":null}]","[{""company"":{""id"":99440945,""name"":""Origami Agents (YC F24)"",""logo"":""https://media.licdn.com/dms/image/v2/D4E0BAQHUmtLK8rnmWQ/company-logo_400_400/company-logo_400_400/0/1732264872946/origamiagents_logo?e=1740614400&v=beta&t=viDmYuPTitbeeFCKUetc5GykqiogytaUhHxv-cTXdrU"",""url"":""https://www.linkedin.com/company/99440945/""},""date"":{""start"":{""month"":10,""year"":2024,""day"":null},""end"":{""year"":null,""month"":null,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":10,""year"":2024,""day"":null},""end"":{""year"":null,""month"":null,""day"":null}},""company"":""Origami Agents (YC F24)"",""description"":"""",""title"":""Co-Founder"",""employment_type"":null}]},{""company"":{""id"":74758844,""name"":""Fizz"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQF6Xwh04dkNYg/company-logo_400_400/company-logo_400_400/0/1630655773340?e=1740614400&v=beta&t=Nin7yQd0ce_sBXqnXtGoyeYRuVXywQU8w_mff2Cqcqo"",""url"":""https://www.linkedin.com/company/74758844/""},""date"":{""start"":{""month"":1,""year"":2021,""day"":null},""end"":{""month"":1,""year"":2024,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":1,""year"":2021,""day"":null},""end"":{""month"":1,""year"":2024,""day"":null}},""company"":""Fizz"",""description"":"""",""title"":""Launch & Operations"",""employment_type"":null}]},{""company"":{""id"":3313690,""name"":""StartX."",""logo"":""https://media.licdn.com/dms/image/v2/C4E0BAQG9OsMFZua_Lg/company-logo_400_400/company-logo_400_400/0/1631316506051?e=1740614400&v=beta&t=s-QESr4b4dos68aKCtWtIlYTH31hM385Jc9k88fBwVA"",""url"":""https://www.linkedin.com/company/3313690/""},""date"":{""start"":{""month"":1,""year"":2022,""day"":null},""end"":{""month"":1,""year"":2023,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":1,""year"":2022,""day"":null},""end"":{""month"":1,""year"":2023,""day"":null}},""company"":""StartX."",""description"":"""",""title"":""Co-Managing Director, Student Accelerator"",""employment_type"":null}]},{""company"":{""id"":1696915,""name"":""Stanford Marketing"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQFoxgxk_bVAlQ/company-logo_400_400/company-logo_400_400/0/1631351574162?e=1740614400&v=beta&t=bZHZ918BifCfAWhzz4kAFEW_IL59__nrAkoIDQGiusk"",""url"":""https://www.linkedin.com/company/1696915/""},""date"":{""start"":{""month"":1,""year"":2021,""day"":null},""end"":{""month"":1,""year"":2023,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":1,""year"":2021,""day"":null},""end"":{""month"":1,""year"":2023,""day"":null}},""company"":""Stanford Marketing"",""description"":"""",""title"":""President"",""employment_type"":null}]}]"
4,Arvind V.,Co-Founder and CEO,"San Francisco, California, United States of America",Fresco (YC F24),https://www.linkedin.com/company/104799979/,,Building Fresco (YC F24) | Acquired Founder,"I’m currently building Fresco (YC F24) an AI copilot for construction superintendents. \n\nPreviously, I was Chief of Staff and Director of Partnerships at January AI, a precision medicine company based in the Bay Area. I have my BA and MS from Brown, and I've also worked at NASA (SynBio), Human Capital (VC), and Vault Health (PM).\n\nI enjoyed an exit from my political tech startup, DownBallot Solutions, in 2022. I also make investments in early-stage technology companies, with a focus on consumer software and digital health. I'm always happy to chat about science or entrepreneurship!",,Construction,"[""B2B sales"", ""Financial Modeling"", ""Strategic Partnerships"", ""Crispr"", ""Report Writing"", ""Grant Writing"", ""Cell Culture"", ""Stem Cell Research"", ""Synthetic Biology"", ""Laboratory Management"", ""Due Diligence"", ""Investments"", ""Early-stage Startups"", ""Communication"", ""Funnel Optimization"", ""Agile Methodologies"", ""Scrum"", ""PRD"", ""Product Management"", ""Strategy"", ""Project Management"", ""Team Management"", ""Public Speaking"", ""Writing"", ""Data Analysis"", ""Web Design"", ""Leadership"", ""Research"", ""SPSS"", ""CRISPR"", ""Python"", ""Microsoft Office""]","[{""date"":{""start"":{""month"":1,""year"":2020,""day"":null},""end"":{""month"":1,""year"":2021,""day"":null}},""school"":{""name"":""Brown University"",""logo"":""https://media.licdn.com/dms/image/v2/C4E0BAQEK5eP7BQ975w/company-logo_400_400/company-logo_400_400/0/1630594275590/brown_university_logo?e=1740614400&v=beta&t=1hXgZbCSEJW-l9HSn_sPbPsHacNMptcTrL-9_BPVMDc"",""url"":""https://www.linkedin.com/company/157343/""},""degree_name"":""Master of Science - MS, Biotechnology"",""field_of_study"":""Master of Science - MS, Biotechnology"",""description"":""Thesis: “Developing an On-Demand Drug Development Platform for Uses on Earth and in Space”\nRecipient of Blue Marble Space Institute Grant and Rhode Island Space Grant""},{""date"":{""start"":{""month"":1,""year"":2016,""day"":null},""end"":{""month"":1,""year"":2020,""day"":null}},""school"":{""name"":""Brown University"",""logo"":""https://media.licdn.com/dms/image/v2/C4E0BAQEK5eP7BQ975w/company-logo_400_400/company-logo_400_400/0/1630594275590/brown_university_logo?e=1740614400&v=beta&t=1hXgZbCSEJW-l9HSn_sPbPsHacNMptcTrL-9_BPVMDc"",""url"":""https://www.linkedin.com/company/157343/""},""degree_name"":""Economics, Chemistry"",""field_of_study"":""Economics, Chemistry"",""description"":null},{""date"":{""start"":{""month"":1,""year"":2013,""day"":null},""end"":{""month"":1,""year"":2016,""day"":null}},""school"":{""name"":""Edina Senior High School"",""logo"":""https://media.licdn.com/dms/image/v2/C4E0BAQGk7cLQCMq7Zg/company-logo_400_400/company-logo_400_400/0/1630599452713?e=1740614400&v=beta&t=NuKLXFtuVUQUchcVtYHKQhWV6K8RdvL2E6pHzqWiTMo"",""url"":""https://www.linkedin.com/company/33437727/""},""degree_name"":"""",""field_of_study"":"""",""description"":null}]","[{""company"":{""id"":104799979,""name"":""Fresco (YC F24)"",""logo"":""https://media.licdn.com/dms/image/v2/D560BAQHTV-YceHFqKA/company-logo_400_400/company-logo_400_400/0/1729818106320/fresco_ai_logo?e=1740614400&v=beta&t=cTIvHKIuPb3InnGClW9Le5Bd_u06c7ZRgtvojFuUdG8"",""url"":""https://www.linkedin.com/company/104799979/""},""date"":{""start"":{""month"":9,""year"":2024,""day"":null},""end"":{""year"":null,""month"":null,""day"":null}},""profile_positions"":[{""location"":""San Francisco, California, United States · On-site"",""date"":{""start"":{""month"":9,""year"":2024,""day"":null},""end"":{""year"":null,""month"":null,""day"":null}},""company"":""Fresco (YC F24)"",""description"":"""",""title"":""Co-Founder and CEO"",""employment_type"":""Full-time""}]},{""company"":{""id"":18116817,""name"":""January AI"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQGxoiNd9WXf2Q/company-logo_400_400/company-logo_400_400/0/1640115655377/january_inc_logo?e=1740614400&v=beta&t=KAfSrpfl2pfIsc1rx04H20-UoKFqBvBbCchltMQbUWY"",""url"":""https://www.linkedin.com/company/18116817/""},""date"":{""start"":{""month"":10,""year"":2022,""day"":null},""end"":{""month"":9,""year"":2024,""day"":null}},""profile_positions"":[{""location"":""Menlo Park, California, United States"",""date"":{""start"":{""month"":10,""year"":2022,""day"":null},""end"":{""month"":9,""year"":2024,""day"":null}},""company"":""January AI"",""description"":""As Chief of Staff, I worked closely with our CEO on key strategic and operational initiatives across all areas of the business.\n\nAs Director of Partnerships, I worked directly with a number of B2B partners and clients to create shared value. Responsible for sourcing, proposing, and negotiating deals, along with associated financial modeling."",""title"":""Chief of Staff and Director of Partnerships"",""employment_type"":""Full-time""}]},{""company"":{""id"":18941883,""name"":""Vault Health"",""logo"":""https://media.licdn.com/dms/image/v2/D4E0BAQF82lFxVrRzZQ/company-logo_400_400/company-logo_400_400/0/1705415552839/vaulthealth_logo?e=1740614400&v=beta&t=qVrj0q6zPt7XWMRIs5tr_46xJfVZqs9Ts4fpDckq9oc"",""url"":""https://www.linkedin.com/company/18941883/""},""date"":{""start"":{""month"":5,""year"":2022,""day"":null},""end"":{""month"":10,""year"":2022,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":5,""year"":2022,""day"":null},""end"":{""month"":10,""year"":2022,""day"":null}},""company"":""Vault Health"",""description"":""Skills: Product Management · Scrum · PRD · Agile Methodologies · Project Management"",""title"":""Product Manager"",""employment_type"":""Full-time""}]},{""company"":{""id"":null,""name"":""Downballot Solutions"",""logo"":null,""url"":""https://www.linkedin.com/search/results/all/?keywords=Downballot+Solutions""},""date"":{""start"":{""month"":5,""year"":2020,""day"":null},""end"":{""month"":3,""year"":2022,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":5,""year"":2020,""day"":null},""end"":{""month"":3,""year"":2022,""day"":null}},""company"":""Downballot Solutions"",""description"":""Developing data-driven campaign solutions for local politicians nationwide.\n\nBootstrapped to $200k ARR before enjoying an exit in March 2022."",""title"":""Founder, CFO"",""employment_type"":""Self-employed""}]},{""company"":{""id"":17901964,""name"":""Human Capital"",""logo"":""https://media.licdn.com/dms/image/v2/D560BAQHleqSsSTd8Ng/company-logo_400_400/company-logo_400_400/0/1683302843014/humandotcapital_logo?e=1740614400&v=beta&t=C0nA5YyBWasbP8ObN5rRavj8jwaSU0xNQ6BvjGH2S5c"",""url"":""https://www.linkedin.com/company/17901964/""},""date"":{""start"":{""month"":8,""year"":2021,""day"":null},""end"":{""month"":2,""year"":2022,""day"":null}},""profile_positions"":[{""location"":""San Francisco, California, United States"",""date"":{""start"":{""month"":8,""year"":2021,""day"":null},""end"":{""month"":2,""year"":2022,""day"":null}},""company"":""Human Capital"",""description"":""Skills: Investments · Due Diligence · Early-stage Startups · Communication · Funnel Optimization"",""title"":""Associate"",""employment_type"":""Full-time""}]},{""company"":{""id"":2003,""name"":""NASA - National Aeronautics and Space Administration"",""logo"":""https://media.licdn.com/dms/image/v2/C4D0BAQGRBHWCcaAqGg/company-logo_400_400/company-logo_400_400/0/1630507197379/nasa_logo?e=1740614400&v=beta&t=ADsvfi3KEHNoFYT2YdTLnkm0dC71qWXnS9gzZAd8XMI"",""url"":""https://www.linkedin.com/company/2003/""},""date"":{""start"":{""month"":3,""year"":2018,""day"":null},""end"":{""month"":6,""year"":2021,""day"":null}},""profile_positions"":[{""location"":""Mountain View, California, United States"",""date"":{""start"":{""month"":5,""year"":2020,""day"":null},""end"":{""month"":6,""year"":2021,""day"":null}},""company"":""NASA - National Aeronautics and Space Administration"",""description"":""Skills: Public Speaking · Crispr · Report Writing · Grant Writing"",""title"":""Synthetic Biologist"",""employment_type"":null},{""location"":""Mountain View, CA"",""date"":{""start"":{""month"":5,""year"":2019,""day"":null},""end"":{""month"":9,""year"":2019,""day"":null}},""company"":""NASA - National Aeronautics and Space Administration"",""description"":""Coordinated a team of student researchers in the creation of a small, portable pharmacy which uses synthetic biology to produce drugs sustainably and on-demand. This project has terrestrial and off-world applications."",""title"":""Lead Student Researcher"",""employment_type"":null},{""location"":""Mountain View, CA"",""date"":{""start"":{""month"":3,""year"":2018,""day"":null},""end"":{""month"":9,""year"":2018,""day"":null}},""company"":""NASA - National Aeronautics and Space Administration"",""description"":""Designed CRISPR experiments to optimize filamentous fungus growth for fungus-based Mars habitat construction (\""mycotecture\""); developed a Python model for mycelium growth for building purposes; presented at NASA Advanced and Innovative Concepts (NIAC) Symposium, lobbying for $500k in funding."",""title"":""Synthetic Biology Student Researcher"",""employment_type"":null}]},{""company"":{""id"":3181,""name"":""University of Minnesota-Twin Cities"",""logo"":""https://media.licdn.com/dms/image/v2/D560BAQEKTpIfhAXtlw/company-logo_400_400/company-logo_400_400/0/1719939334329/university_of_minnesota_logo?e=1740614400&v=beta&t=46foXeUPCBHxTgD7n5VeHEeKVISPMiR1pGixkWcd-gw"",""url"":""https://www.linkedin.com/company/3181/""},""date"":{""start"":{""month"":5,""year"":2017,""day"":null},""end"":{""month"":10,""year"":2017,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":5,""year"":2017,""day"":null},""end"":{""month"":10,""year"":2017,""day"":null}},""company"":""University of Minnesota-Twin Cities"",""description"":""Conducted data analysis on Challenge and Chronic studies, breakthrough treatments which attempt to use intranasal oxytocin (IN-OT) to mediate the symptoms of autism; recruited subjects for national SPARK registry and for further research projects; assisted in due diligence on the AV1ATION study (also IN-OT) conducted by Roche."",""title"":""Researcher"",""employment_type"":null}]},{""company"":{""id"":9238,""name"":""University of Minnesota Medical Center"",""logo"":""https://media.licdn.com/dms/image/v2/C560BAQEiddTvORvQRw/company-logo_400_400/company-logo_400_400/0/1631349859244?e=1740614400&v=beta&t=5zmNUQANn2bPmjGBKrtdo3o-LXSK4hqtF-LAv1B0ATQ"",""url"":""https://www.linkedin.com/company/9238/""},""date"":{""start"":{""month"":5,""year"":2015,""day"":null},""end"":{""month"":8,""year"":2015,""day"":null}},""profile_positions"":[{""location"":null,""date"":{""start"":{""month"":5,""year"":2015,""day"":null},""end"":{""month"":8,""year"":2015,""day"":null}},""company"":""University of Minnesota Medical Center"",""description"":""Conducted literature reviews with postdoctoral fellows; worked with data sets; evaluated efficiency of screening process."",""title"":""Research Assistant"",""employment_type"":null}]}]"


In [3]:
# Helper function to extract the "name" field using a simple regex
def extract_names_simple(data_str):
    try:
        # Find all occurrences of "name": "value"
        names = re.findall(r'"name":\s?"(.*?)"', data_str)
        return ", ".join(names) if names else None
    except Exception as e:
        return None  # Return None if parsing fails

# Helper function to convert the skills column into a readable string
def process_skills(skills_str):
    try:
        # Convert the string representation of a list into an actual list
        skills_list = ast.literal_eval(skills_str)
        if isinstance(skills_list, list):
            return ", ".join(skills_list)  # Join the list into a string
        return skills_str  # If not a list, return the original string
    except (ValueError, SyntaxError):
        return None  # Return None if parsing fails

# Apply the updated function to the education, work history, and skills columns
def preprocess_columns_simple(df):
    df['education'] = df['education'].apply(extract_names_simple)
    df['work_history'] = df['work_history'].apply(extract_names_simple)
    df['skills'] = df['skills'].apply(process_skills)
    return df

# Preprocess the dataset
people_preprocessed = preprocess_columns_simple(people_filtered.copy())


In [4]:
# Helper function to generate a descriptive paragraph for each row
def generate_paragraph(row):
    # Start the paragraph with basic information
    full_name = row.get('full_name', None)
    title = row.get('title', None)
    company = row.get('company', None)
    location = row.get('location', None)
    company_description = row.get('company_description', None)
    sub_title = row.get('sub_title', None)
    summary = row.get('summary', None)
    current_job_description = row.get('current_job_description', None)
    skills = row.get('skills', None)
    education = row.get('education', None)
    work_history = row.get('work_history', None)

    # Build the descriptive paragraph dynamically
    sentences = []

    if full_name and title and company:
        sentences.append(f"{full_name}, currently working as {title} at {company}.")
    if location:
        sentences[-1] += f" They are based in {location}."
    if company_description:
        sentences.append(f"{company} specializes in {company_description}.")
    if sub_title:
        sentences.append(f"Sub-title: {sub_title}.")
    if summary:
        sentences.append(f"Summary: {summary}.")
    if current_job_description:
        sentences.append(f"Current Job Description: {current_job_description}.")
    if skills:
        sentences.append(f"Their skills include: {skills}.")
    if education:
        sentences.append(f"Their educational background includes: {education}.")
    if work_history:
        sentences.append(f"They have worked in roles such as: {work_history}.")

    # Combine sentences into a single paragraph
    return " ".join(sentences)

# Apply the function to generate paragraphs
people_preprocessed['descriptive_paragraph'] = people_preprocessed.apply(generate_paragraph, axis=1)

# Display a few sample paragraphs
print("Sample Descriptive Paragraphs:")
display(people_preprocessed[['full_name', 'descriptive_paragraph']].head())


Sample Descriptive Paragraphs:


Unnamed: 0,full_name,descriptive_paragraph
0,Edward Aryee,"Edward Aryee, currently working as Co-Founder & CTO at SRE.ai (YC F24). They are based in San Francisco Bay, San Francisco Bay Area, United States of America. SRE.ai (YC F24) specializes in nan. Sub-title: Co-Founder & CTO at SRE.ai (YC F24) | ex-Google. Summary: nan. Current Job Description: An AI-powered automation platform for Salesforce development teams.. Their skills include: Programming, Python, Java, JavaScript, Matlab, Computer Science, Public Speaking. Their educational background includes: Drexel University. They have worked in roles such as: SRE.ai (YC F24), Black Angel Group (BAG), Google, Microsoft, StratIS IoT, Web Presence in China, BuLogics, Virtual Pantry, Columbia University."
1,Victor Cheng,"Victor Cheng, currently working as Co-Founder and CEO at vly.ai (YC F24). They are based in San Francisco, California, United States of America. vly.ai (YC F24) specializes in nan. Sub-title: co-founder @ vly.ai (YC F24). Summary: cooking. Current Job Description: The easiest way to build custom full-stack software without code. Backed by Y Combinator. Their skills include: Startups, TypeScript, Git, Express.js, MongoDB, Full-Stack Development, Node.js, Competitive Programming, Next.js, Software Development, React.js, C++, JavaScript, C#, Java, Unity3D, Business, Mathematics, Robotics, Mobile Application Development, Android Studio. Their educational background includes: University of Washington, Skyline High School, Y Combinator. They have worked in roles such as: vly.ai (YC F24), Hatch Coding, Minute Land, Quantum Labs, Autodesk, FRC Team 2976, Spartabots, Self-employed."
2,Daryl Budiman,"Daryl Budiman, currently working as Co-Founder & CEO at Andoria (YC F24). They are based in San Francisco Bay, San Francisco Bay Area, United States of America. Andoria (YC F24) specializes in nan. Sub-title: Co-Founder at Andoria (YC F24) | Prev. MultiOn & Stanford. Summary: Imagine if you didn't have to learn any piece of software anymore.. Current Job Description: Backed by YC, among other great investors.. Their skills include: Customer Onboarding, Customer Success, SwiftUI, C++, React.js, Microsoft PowerPoint, HTML, CSS, JavaScript, Python, Presentation Skills, Public Speaking, Adobe Photoshop, Research, ArcGIS, Figma, Leadership, User Interface Design, Computer-Aided Design (CAD), Autodesk Fusion 360. Their educational background includes: Stanford University, Y Combinator. They have worked in roles such as: Andoria (YC F24), MultiOn, Amazon, The Marriage Pact, Evernote, Matcha, Stanford University School of Medicine."
3,Finn Mallery,"Finn Mallery, currently working as Co-Founder at Origami Agents (YC F24). They are based in Palo Alto, California, United States of America. Origami Agents (YC F24) specializes in nan. Sub-title: Co-Founder @ Origami Agents (YC F24). Summary: nan. Current Job Description: nan. Their educational background includes: Stanford University, Stanford University School of Engineering, Z Fellows, Canyon Crest Academy. They have worked in roles such as: Origami Agents (YC F24), Fizz, StartX., Stanford Marketing."
4,Arvind V.,"Arvind V., currently working as Co-Founder and CEO at Fresco (YC F24). They are based in San Francisco, California, United States of America. Fresco (YC F24) specializes in nan. Sub-title: Building Fresco (YC F24) | Acquired Founder. Summary: I’m currently building Fresco (YC F24) an AI copilot for construction superintendents. \n\nPreviously, I was Chief of Staff and Director of Partnerships at January AI, a precision medicine company based in the Bay Area. I have my BA and MS from Brown, and I've also worked at NASA (SynBio), Human Capital (VC), and Vault Health (PM).\n\nI enjoyed an exit from my political tech startup, DownBallot Solutions, in 2022. I also make investments in early-stage technology companies, with a focus on consumer software and digital health. I'm always happy to chat about science or entrepreneurship!. Current Job Description: nan. Their skills include: B2B sales, Financial Modeling, Strategic Partnerships, Crispr, Report Writing, Grant Writing, Cell Culture, Stem Cell Research, Synthetic Biology, Laboratory Management, Due Diligence, Investments, Early-stage Startups, Communication, Funnel Optimization, Agile Methodologies, Scrum, PRD, Product Management, Strategy, Project Management, Team Management, Public Speaking, Writing, Data Analysis, Web Design, Leadership, Research, SPSS, CRISPR, Python, Microsoft Office. Their educational background includes: Brown University, Brown University, Edina Senior High School. They have worked in roles such as: Fresco (YC F24), January AI, Vault Health, Downballot Solutions, Human Capital, NASA - National Aeronautics and Space Administration, University of Minnesota-Twin Cities, University of Minnesota Medical Center."


In [6]:
# Load the new dataset
personal_data_path = './data/Sudarshan Sridharan People.csv'
personal_data = pd.read_csv(personal_data_path)

# Preprocessing functions reused from the previous notebook
# (No need to redefine extract_names_simple and process_skills)

# Helper function to process the new file into a descriptive paragraph
def generate_advertising_paragraph(row):
    # Basic information
    full_name = row.get('full_name', None)
    title = row.get('title', None)
    company = row.get('company', None)
    location = row.get('location', None)
    company_description = row.get('company_description', None)
    work_history = row.get('work_history', None)
    education = row.get('education', None)
    skills = row.get('skills', None)

    # Build the paragraph dynamically
    sentences = []
    
    if full_name and title and company:
        sentences.append(f"{full_name} is the {title} at {company}.")
    if location:
        sentences[-1] += f" They are based in {location}."
    if company_description:
        sentences.append(f"{company} focuses on: {company_description}.")
    if skills:
        sentences.append(f"Key skills include: {skills}.")
    if education:
        sentences.append(f"Educational background includes: {education}.")
    if work_history:
        sentences.append(f"Past work includes roles such as: {work_history}.")

    # Combine and clean up
    return " ".join(sentences)

# Preprocess the new dataset
personal_data['education'] = personal_data['education'].apply(extract_names_simple)
personal_data['work_history'] = personal_data['work_history'].apply(extract_names_simple)
personal_data['skills'] = personal_data['skills'].apply(process_skills)

# Generate the descriptive paragraph
personal_data['advertising_paragraph'] = personal_data.apply(generate_advertising_paragraph, axis=1)

# Display the output
print("Sample Advertising Paragraphs:")
display(personal_data[['full_name', 'advertising_paragraph']].head())


Sample Advertising Paragraphs:


Unnamed: 0,full_name,advertising_paragraph
0,Sudarshan Sridharan,"Sudarshan Sridharan is the Founder at Pipeline. They are based in San Francisco Bay, San Francisco Bay Area, United States of America. Pipeline focuses on: Get more leads, close more deals. Pipeline sets-up and manages the outbound sales stack for early stage B2B startups. Automate your sales.... Key skills include: Investing. Educational background includes: Clemson University. Past work includes roles such as: Pipeline, Fion Technologies, SaveMAPS, Second Reality Interactive, INC., Peak 15 Capital."


In [10]:
# Ensure 'people_preprocessed' and 'new_people_data' DataFrames exist from previous steps

# Extract the single paragraph from the new people's data
advertising_paragraph = personal_data['advertising_paragraph'].iloc[0]  # Assuming only one row

# Create a DataFrame with pairs of paragraphs
paired_paragraphs = people_preprocessed[['full_name', 'descriptive_paragraph']].copy()
paired_paragraphs['advertising_paragraph'] = advertising_paragraph  # Add the single advertising paragraph to all rows

# Display the paired paragraphs
print("Paired Paragraphs (Personal Profile and Advertising Profile):")
display(paired_paragraphs.head())


Paired Paragraphs (Personal Profile and Advertising Profile):


Unnamed: 0,full_name,descriptive_paragraph,advertising_paragraph
0,Edward Aryee,"Edward Aryee, currently working as Co-Founder & CTO at SRE.ai (YC F24). They are based in San Francisco Bay, San Francisco Bay Area, United States of America. SRE.ai (YC F24) specializes in nan. Sub-title: Co-Founder & CTO at SRE.ai (YC F24) | ex-Google. Summary: nan. Current Job Description: An AI-powered automation platform for Salesforce development teams.. Their skills include: Programming, Python, Java, JavaScript, Matlab, Computer Science, Public Speaking. Their educational background includes: Drexel University. They have worked in roles such as: SRE.ai (YC F24), Black Angel Group (BAG), Google, Microsoft, StratIS IoT, Web Presence in China, BuLogics, Virtual Pantry, Columbia University.","Sudarshan Sridharan is the Founder at Pipeline. They are based in San Francisco Bay, San Francisco Bay Area, United States of America. Pipeline focuses on: Get more leads, close more deals. Pipeline sets-up and manages the outbound sales stack for early stage B2B startups. Automate your sales.... Key skills include: Investing. Educational background includes: Clemson University. Past work includes roles such as: Pipeline, Fion Technologies, SaveMAPS, Second Reality Interactive, INC., Peak 15 Capital."
1,Victor Cheng,"Victor Cheng, currently working as Co-Founder and CEO at vly.ai (YC F24). They are based in San Francisco, California, United States of America. vly.ai (YC F24) specializes in nan. Sub-title: co-founder @ vly.ai (YC F24). Summary: cooking. Current Job Description: The easiest way to build custom full-stack software without code. Backed by Y Combinator. Their skills include: Startups, TypeScript, Git, Express.js, MongoDB, Full-Stack Development, Node.js, Competitive Programming, Next.js, Software Development, React.js, C++, JavaScript, C#, Java, Unity3D, Business, Mathematics, Robotics, Mobile Application Development, Android Studio. Their educational background includes: University of Washington, Skyline High School, Y Combinator. They have worked in roles such as: vly.ai (YC F24), Hatch Coding, Minute Land, Quantum Labs, Autodesk, FRC Team 2976, Spartabots, Self-employed.","Sudarshan Sridharan is the Founder at Pipeline. They are based in San Francisco Bay, San Francisco Bay Area, United States of America. Pipeline focuses on: Get more leads, close more deals. Pipeline sets-up and manages the outbound sales stack for early stage B2B startups. Automate your sales.... Key skills include: Investing. Educational background includes: Clemson University. Past work includes roles such as: Pipeline, Fion Technologies, SaveMAPS, Second Reality Interactive, INC., Peak 15 Capital."
2,Daryl Budiman,"Daryl Budiman, currently working as Co-Founder & CEO at Andoria (YC F24). They are based in San Francisco Bay, San Francisco Bay Area, United States of America. Andoria (YC F24) specializes in nan. Sub-title: Co-Founder at Andoria (YC F24) | Prev. MultiOn & Stanford. Summary: Imagine if you didn't have to learn any piece of software anymore.. Current Job Description: Backed by YC, among other great investors.. Their skills include: Customer Onboarding, Customer Success, SwiftUI, C++, React.js, Microsoft PowerPoint, HTML, CSS, JavaScript, Python, Presentation Skills, Public Speaking, Adobe Photoshop, Research, ArcGIS, Figma, Leadership, User Interface Design, Computer-Aided Design (CAD), Autodesk Fusion 360. Their educational background includes: Stanford University, Y Combinator. They have worked in roles such as: Andoria (YC F24), MultiOn, Amazon, The Marriage Pact, Evernote, Matcha, Stanford University School of Medicine.","Sudarshan Sridharan is the Founder at Pipeline. They are based in San Francisco Bay, San Francisco Bay Area, United States of America. Pipeline focuses on: Get more leads, close more deals. Pipeline sets-up and manages the outbound sales stack for early stage B2B startups. Automate your sales.... Key skills include: Investing. Educational background includes: Clemson University. Past work includes roles such as: Pipeline, Fion Technologies, SaveMAPS, Second Reality Interactive, INC., Peak 15 Capital."
3,Finn Mallery,"Finn Mallery, currently working as Co-Founder at Origami Agents (YC F24). They are based in Palo Alto, California, United States of America. Origami Agents (YC F24) specializes in nan. Sub-title: Co-Founder @ Origami Agents (YC F24). Summary: nan. Current Job Description: nan. Their educational background includes: Stanford University, Stanford University School of Engineering, Z Fellows, Canyon Crest Academy. They have worked in roles such as: Origami Agents (YC F24), Fizz, StartX., Stanford Marketing.","Sudarshan Sridharan is the Founder at Pipeline. They are based in San Francisco Bay, San Francisco Bay Area, United States of America. Pipeline focuses on: Get more leads, close more deals. Pipeline sets-up and manages the outbound sales stack for early stage B2B startups. Automate your sales.... Key skills include: Investing. Educational background includes: Clemson University. Past work includes roles such as: Pipeline, Fion Technologies, SaveMAPS, Second Reality Interactive, INC., Peak 15 Capital."
4,Arvind V.,"Arvind V., currently working as Co-Founder and CEO at Fresco (YC F24). They are based in San Francisco, California, United States of America. Fresco (YC F24) specializes in nan. Sub-title: Building Fresco (YC F24) | Acquired Founder. Summary: I’m currently building Fresco (YC F24) an AI copilot for construction superintendents. \n\nPreviously, I was Chief of Staff and Director of Partnerships at January AI, a precision medicine company based in the Bay Area. I have my BA and MS from Brown, and I've also worked at NASA (SynBio), Human Capital (VC), and Vault Health (PM).\n\nI enjoyed an exit from my political tech startup, DownBallot Solutions, in 2022. I also make investments in early-stage technology companies, with a focus on consumer software and digital health. I'm always happy to chat about science or entrepreneurship!. Current Job Description: nan. Their skills include: B2B sales, Financial Modeling, Strategic Partnerships, Crispr, Report Writing, Grant Writing, Cell Culture, Stem Cell Research, Synthetic Biology, Laboratory Management, Due Diligence, Investments, Early-stage Startups, Communication, Funnel Optimization, Agile Methodologies, Scrum, PRD, Product Management, Strategy, Project Management, Team Management, Public Speaking, Writing, Data Analysis, Web Design, Leadership, Research, SPSS, CRISPR, Python, Microsoft Office. Their educational background includes: Brown University, Brown University, Edina Senior High School. They have worked in roles such as: Fresco (YC F24), January AI, Vault Health, Downballot Solutions, Human Capital, NASA - National Aeronautics and Space Administration, University of Minnesota-Twin Cities, University of Minnesota Medical Center.","Sudarshan Sridharan is the Founder at Pipeline. They are based in San Francisco Bay, San Francisco Bay Area, United States of America. Pipeline focuses on: Get more leads, close more deals. Pipeline sets-up and manages the outbound sales stack for early stage B2B startups. Automate your sales.... Key skills include: Investing. Educational background includes: Clemson University. Past work includes roles such as: Pipeline, Fion Technologies, SaveMAPS, Second Reality Interactive, INC., Peak 15 Capital."


In [8]:
import anthropic

client = anthropic.Anthropic(api_key=ANTHROPIC_API_KEY)

message = client.messages.create(
    model="claude-3-5-sonnet-20241022",
    max_tokens=1000,
    temperature=0,
    system="You are a world-class poet. Respond only with short poems.",
    messages=[
        {
            "role": "user",
            "content": [
                {
                    "type": "text",
                    "text": "Why is the ocean salty?"
                }
            ]
        }
    ]
)
print(message.content)


KeyboardInterrupt: 