#### Create Final Table that will be sent to LLM Model

In [0]:
# Read the data from the intermediate table
df_investments_funding = spark.read.table("dev_db.intermediate.investments_funding")
df_active_companies = spark.read.table("dev_db.intermediate.active_companies")

In [0]:
# Get the latest date for each org_uuid
df_latest_raise = (
    df_investments_funding.groupBy("org_uuid")
    .agg({"announced_on": "max"})
    .withColumnRenamed("MAX(announced_on)", "latest_raise")
)

In [0]:
# Get the amount raised, investments for latest raise for each org_uuid
import pyspark.sql.functions as F

df_latest_funding = (
    df_latest_raise.alias("a")
    .join(
        df_investments_funding.alias("b"),
        (F.col("a.org_uuid") == F.col("b.org_uuid"))
        & (F.col("a.latest_raise") == F.col("b.announced_on")),
        "left",
    )
    .groupBy("a.org_uuid", "a.latest_raise")
    .agg(
        F.sum(F.col("b.raised_amount_usd")).alias("raised_amount"),
        F.array_join(F.collect_set(F.col("b.investments")), ", ").alias("investments"),
    )
)

In [0]:
from pyspark.sql.functions import col, concat_ws, lit

# Join Active companies to latest funding to get each company's latest funding
df_active_companies_latest = df_active_companies.join(
    df_latest_funding, on="org_uuid", how="left"
).select(
    col("org_uuid"),
    col("name"),
    col("org_type"),
    col("country_code"),
    col("homepage_url"),
    col("status"),
    col("description"),
    col("investments"),
    concat_ws(
        " ",
        col("description"),
        lit(" Website: "),
        col("homepage_url"),
        lit(" Headquarter: "),
        col("country_code"),
        lit(" Recent Investments: "),
        col("investments"),
        lit(" Amount Raised: "),
        col("raised_amount"),
        lit(" Date Announced: "),
        col("latest_raise"),
    ).alias("company_information"),
)

In [0]:
# Write the table to Unity Catalog.
df_active_companies_latest.write.format("delta").mode("overwrite").option("overwriteSchema", "true").saveAsTable("dev_db.core.active_companies_information")

In [0]:
%sql
select * from dev_db.core.active_companies_information

org_uuid,name,org_type,country_code,homepage_url,status,description,investments,company_information
8c57c3c2-e65b-e45b-c754-89dc9f85580a,Gaia Online,organization,USA,https://www.gaiaonline.com/,operating,"Gaia Online has grown into one of the biggest forum communities in the world. Today, Gaia is the best place on the web to discuss anime, games, comics, sci-fi, fantasy and anything else you can imagine. Plus, there are tons of other free features to keep Gaia members permanently amused.",IVP investment in Series C - Gaia Online,"Gaia Online has grown into one of the biggest forum communities in the world. Today, Gaia is the best place on the web to discuss anime, games, comics, sci-fi, fantasy and anything else you can imagine. Plus, there are tons of other free features to keep Gaia members permanently amused. Website: https://www.gaiaonline.com/ Headquarter: USA Recent Investments: IVP investment in Series C - Gaia Online Amount Raised: 11000000 Date Announced: 2008-07-14"
6d2fff57-32b5-f75c-9986-97539d1bf366,Viddler,organization,USA,http://www.viddler.com,operating,"Viddler has a long history of innovation in online video, developing patented new approaches, and transforming video from a passive viewing experience to an interactive, measurable, user-centered one. Backed by a powerful, secure content delivery network, Viddler delivers millions of videos for thousands of businesses around the world every day. Mobile technology is everywhere. To accommodate this, Viddler has developed far-reaching HTML5 video player technology—expanding the concept of “learn anywhere” interactivity between instructors and students or consultants and clients. We are focused on: our innovation, our interactive video player, and our strong customer service. Our player systems allow us to have people who truly understand the message of a learning video because we refuse to have a passive user viewing experience.",,"Viddler has a long history of innovation in online video, developing patented new approaches, and transforming video from a passive viewing experience to an interactive, measurable, user-centered one. Backed by a powerful, secure content delivery network, Viddler delivers millions of videos for thousands of businesses around the world every day. Mobile technology is everywhere. To accommodate this, Viddler has developed far-reaching HTML5 video player technology—expanding the concept of “learn anywhere” interactivity between instructors and students or consultants and clients. We are focused on: our innovation, our interactive video player, and our strong customer service. Our player systems allow us to have people who truly understand the message of a learning video because we refuse to have a passive user viewing experience. Website: http://www.viddler.com Headquarter: USA Recent Investments: Amount Raised: 294638 Date Announced: 2012-04-06"
0cf4f50a-b749-04be-589f-301dc97dc6b5,Music Intelligence Solutions,organization,USA,https://uplaya.com,operating,"Music Intelligence Solutions, Inc.,is a ''smart'' music discovery player. MIS is a global digital media corporation with offices in San Francisco, CA; Savannah, GA; and Barcelona, Spain. The Company uses patent-approved technology to enhance the consumer experience with digital content including music and video. Ecosystem partners and customers include major music labels, digital media companies, mobile services providers and web 2.0 Internet services companies such as social networks and online retail portals. The approaches used by MIS across all product lines incorporate decades of development by the original research and development team, which consisted of musicians as well as world-class PHD physicists and mathematicians.",,"Music Intelligence Solutions, Inc.,is a ''smart'' music discovery player. MIS is a global digital media corporation with offices in San Francisco, CA; Savannah, GA; and Barcelona, Spain. The Company uses patent-approved technology to enhance the consumer experience with digital content including music and video. Ecosystem partners and customers include major music labels, digital media companies, mobile services providers and web 2.0 Internet services companies such as social networks and online retail portals. The approaches used by MIS across all product lines incorporate decades of development by the original research and development team, which consisted of musicians as well as world-class PHD physicists and mathematicians. Website: https://uplaya.com Headquarter: USA Recent Investments: Amount Raised: 7000000 Date Announced: 2006-12-10"
6580c555-b205-0217-a183-4f42ce114765,Ampersand Capital Partners,organization,USA,http://www.ampersandcapital.com,operating,Ampersand is a middle market private equity firm that focuses on healthcare and industrial sectors.,,Ampersand is a middle market private equity firm that focuses on healthcare and industrial sectors. Website: http://www.ampersandcapital.com Headquarter: USA Recent Investments: Amount Raised: 18834000 Date Announced: 2023-06-29
5f932f59-dcec-0faa-c93c-4b524228e529,Akampus,organization,TUR,http://www.akampusyouth.com,operating,"Akampus is a youth marketing agency established in Istanbul, Turkey. It is a social network ''''a la Facebook'''' for college students and graduates. Akampus specializes in youth and social media marketing, youth crowdsourcing, advertising, guerilla marketing, promotions, and event marketing. It is a platform that helps companies reach the teen to young adult demographic group. Akampus was founded by entrepreneurs Ibrahim Ugdul and Evren Güney in August 2000. They chose Bogazici University in Istanbul as a starting community in 2000, and now, Akampus targets all Turkish university students, graduates, and Turkish-speaking students in universities abroad.",,"Akampus is a youth marketing agency established in Istanbul, Turkey. It is a social network ''''a la Facebook'''' for college students and graduates. Akampus specializes in youth and social media marketing, youth crowdsourcing, advertising, guerilla marketing, promotions, and event marketing. It is a platform that helps companies reach the teen to young adult demographic group. Akampus was founded by entrepreneurs Ibrahim Ugdul and Evren Güney in August 2000. They chose Bogazici University in Istanbul as a starting community in 2000, and now, Akampus targets all Turkish university students, graduates, and Turkish-speaking students in universities abroad. Website: http://www.akampusyouth.com Headquarter: TUR Recent Investments: Amount Raised: Date Announced: 2000-01-01"
8d71fc18-7185-5f38-6681-8d4c683bfa47,Alibris,organization,USA,http://www.alibris.com,operating,"Alibris (pronounced ''uh-LEE-briss'') is the premier online marketplace for independent sellers of new and used books, music, and movies, as well as rare and collectible titles. They connect people who love books, music, and movies to more than 100 million items from thousands of sellers worldwide. Since launching in November 1998, They've grown to become the Internet’s largest independently owned and operated marketplace. Join them in their second decade. They promise you'll always be able to find plenty of good books, music, and movies. We look forward to many more years together.",,"Alibris (pronounced ''uh-LEE-briss'') is the premier online marketplace for independent sellers of new and used books, music, and movies, as well as rare and collectible titles. They connect people who love books, music, and movies to more than 100 million items from thousands of sellers worldwide. Since launching in November 1998, They've grown to become the Internet’s largest independently owned and operated marketplace. Join them in their second decade. They promise you'll always be able to find plenty of good books, music, and movies. We look forward to many more years together. Website: http://www.alibris.com Headquarter: USA Recent Investments: Amount Raised: 4800000 Date Announced: 2004-02-01"
fb70402d-641d-97be-51a3-63651ff9b532,KQED,organization,USA,http://www.kqed.org,operating,"We're your NorCal NPR and PBS stations, and this is us on Pinterest.",Patrick J. McGovern Foundation investment in Grant - KQED,"We're your NorCal NPR and PBS stations, and this is us on Pinterest. Website: http://www.kqed.org Headquarter: USA Recent Investments: Patrick J. McGovern Foundation investment in Grant - KQED Amount Raised: 200000 Date Announced: 2022-01-19"
bbf2555d-6b35-2109-b1b0-171cbd044495,AlphaClone,organization,USA,http://www.alphaclone.com,operating,"AlphaClone is an investment advisory and research firm that enables long-term investors to access alpha-generating stock ideas and investment strategies. The company's investment research approach, a process called ''cloning'', utilizes hedge fund public disclosures to construct and backtest equity investment strategies. The firm’s investment research and strategies are available for investors through managed accounts and exchange-traded funds. AlphaClone was founded in 2008 with a mission to help people regain control over their investment portfolios. It is headquartered in San Francisco, California.",Operative Capital investment in Series A - AlphaClone,"AlphaClone is an investment advisory and research firm that enables long-term investors to access alpha-generating stock ideas and investment strategies. The company's investment research approach, a process called ''cloning'', utilizes hedge fund public disclosures to construct and backtest equity investment strategies. The firm’s investment research and strategies are available for investors through managed accounts and exchange-traded funds. AlphaClone was founded in 2008 with a mission to help people regain control over their investment portfolios. It is headquartered in San Francisco, California. Website: http://www.alphaclone.com Headquarter: USA Recent Investments: Operative Capital investment in Series A - AlphaClone Amount Raised: 2250000 Date Announced: 2015-09-15"
e95920a2-4124-862f-0bad-88ed2b1d2c5b,Profit Point,organization,USA,http://www.profitpt.com,operating,"Profit Point Inc. was founded in 1995 and is now a global leader in supply chain optimization. The company's team of supply chain consultants includes industry leaders in the fields infrastructure planning, green operations, supply chain planning, distribution, scheduling, transportation, warehouse improvement and business optimization. Profit Point's combined software and service solutions that have been successfully applied across a breadth of industries and by a diverse set of companies, including Dow Chemical, Coca-Cola, Lifetech, Logitech and Toyota.",Square 1 Bank investment in Debt Financing - Profit Point,"Profit Point Inc. was founded in 1995 and is now a global leader in supply chain optimization. The company's team of supply chain consultants includes industry leaders in the fields infrastructure planning, green operations, supply chain planning, distribution, scheduling, transportation, warehouse improvement and business optimization. Profit Point's combined software and service solutions that have been successfully applied across a breadth of industries and by a diverse set of companies, including Dow Chemical, Coca-Cola, Lifetech, Logitech and Toyota. Website: http://www.profitpt.com Headquarter: USA Recent Investments: Square 1 Bank investment in Debt Financing - Profit Point Amount Raised: 2500000 Date Announced: 2011-08-30"
37814cee-be4c-3c68-bd22-a6eef7db8e05,InfoUSA,organization,USA,https://www.dataaxleusa.com,operating,"Info USA offers a full range of affordable sales and marketing solutions to help businesses acquire, manage, and retain customers. These solutions include mailing lists, sales leads, search engine marketing, email marketing, direct mail marketing, data enhancement, and online marketing. Info USA is based in Papillion, Nebraska.",,"Info USA offers a full range of affordable sales and marketing solutions to help businesses acquire, manage, and retain customers. These solutions include mailing lists, sales leads, search engine marketing, email marketing, direct mail marketing, data enhancement, and online marketing. Info USA is based in Papillion, Nebraska. Website: https://www.dataaxleusa.com Headquarter: USA Recent Investments: Amount Raised: 18000000 Date Announced: 2000-06-01"
