In [1]:
from extract_transcript_link_tool import ExtractTranscriptLinkTool
from visit_web_page_tool import VisitWebPageTool
from atom_feed_tool import AtomFeedTool
from extract_trasnscript_content_tool import ExtractTranscriptContentTool
import os, json
from langchain_huggingface import HuggingFaceEmbeddings
from langchain.docstore.document import Document
from langchain.text_splitter import RecursiveCharacterTextSplitter
from transformers import AutoTokenizer
from langchain_chroma import Chroma

In [2]:
embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")

In [3]:
text_splitter = RecursiveCharacterTextSplitter.from_huggingface_tokenizer(
    AutoTokenizer.from_pretrained("thenlper/gte-small"),
    chunk_size=200,
    chunk_overlap=20,
    add_start_index=True,
    strip_whitespace=True,
    separators=["\n\n", "\n", ".", " ", ""],
)

In [4]:
feed_tool = AtomFeedTool()
response = feed_tool("https://www.thecloudcast.net/feeds/posts/default")

In [5]:
print("no of entries = ", len(response))

docs_processed = []

for entry in response:
    print("title = ", entry.title)
    print("link = ", entry.link)
    content = await VisitWebPageTool()(url=entry.link, clean_flag=False)
    transcript_link = ExtractTranscriptLinkTool()(content)
    print("transcript_link = ", transcript_link)
    if transcript_link is not None:
        transcript = await VisitWebPageTool()(url=transcript_link, clean_flag=True)
        transcript_content = ExtractTranscriptContentTool()(transcript)
        with open(os.path.join("transcripts", entry.title), "w") as f:
            f.write(transcript_content)
            print(f"Transcript content saved to {entry.title}")

        # Split the transcript content into chunks
        payload = {"title": entry.title, "link": entry.link, "content": transcript_content}
        documents = text_splitter.split_text(json.dumps(payload))

        # Create Document objects
        docs = [Document(page_content=doc) for doc in documents]
        docs_processed = docs_processed + docs

vector_store = Chroma.from_documents(docs_processed, embeddings, persist_directory="./chroma_db")

no of entries =  25
title =  Listen to The Cloudcast
link =  https://www.thecloudcast.net/2020/08/listen-to-cloudcast.html
browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Listen to The Cloudcast
Transcript tag not found.
transcript_link =  None
title =  AI Augmenting vs. Replacing
link =  https://www.thecloudcast.net/2025/04/ai-augmenting-vs-replacing.html
browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: AI Augmenting vs. Replacing
Transcript URL: https://docs.google.com/document/d/1uTt4igQ1F8i-H82E6n2SkVdS9nUGnsvPR1CNr9ft6Ak/edit?usp=sharing
transcript_link = 

huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Deep Learning Meets CyberSecurity
Transcript tag not found.
transcript_link =  None
title =  Tempering AI Expectations in the Enterprise
link =  https://www.thecloudcast.net/2025/04/tempering-ai-expectations-in-enterprise.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Tempering AI Expectations in the Enterprise
Transcript URL: https://docs.google.com/document/d/1p4ZettsIwtpXntYlFhUpYdsoL0Wvmpi61maJVEt1U68/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/1p4ZettsIwtpXntYlFhUpYdsoL0Wvmpi61maJVEt1U68/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #914 - Tempering AI Expectations in the Enterprise - Google Docs
Match found in the HTML content.
Transcript content saved to Tempering AI Expectations in the Enterprise
title =  AI Agents vs. AI Assistants
link =  https://www.thecloudcast.net/2025/04/ai-agents-vs-ai-assistants.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: AI Agents vs. AI Assistants
Transcript tag not found.
transcript_link =  None
title =  How Things Can Change for the 900lb Gorilla in Tech
link =  https://www.thecloudcast.net/2025/04/how-things-can-change-for-900lb-gorilla.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: How Things Can Change for the 900lb Gorilla in Tech
Transcript URL: https://docs.google.com/document/d/1Qod9uOIBE_LUNBUkwX3l9cBMWUWNMGtzkXQwBR-M9Hc/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/1Qod9uOIBE_LUNBUkwX3l9cBMWUWNMGtzkXQwBR-M9Hc/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #912 - How Things Can Change for the 900lb Gorilla in Tech - Google Docs
Match found in the HTML content.
Transcript content saved to How Things Can Change for the 900lb Gorilla in Tech
title =  AI & Cloud Trends for March 2025
link =  https://www.thecloudcast.net/2025/04/ai-cloud-trends-for-march.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: AI & Cloud Trends for March 2025
Transcript URL: https://docs.google.com/document/d/1UY197iZYzYkrteIFqm-EB_ORt8hhOm5CtX2g5GgQkIA/edit?tab=t.0
transcript_link =  https://docs.google.com/document/d/1UY197iZYzYkrteIFqm-EB_ORt8hhOm5CtX2g5GgQkIA/edit?tab=t.0


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #911 - AI & Cloud Trends for March - Google Docs
Match found in the HTML content.
Transcript content saved to AI & Cloud Trends for March 2025
title =  That Feeling of Losing Technical Knowledge
link =  https://www.thecloudcast.net/2025/03/that-feeling-of-losing-technical.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: That Feeling of Losing Technical Knowledge
Transcript URL: https://docs.google.com/document/d/1u21XAxB6b0FsYNPX4zzAMpGVWN4cQDGWyosvV6LTnN0/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/1u21XAxB6b0FsYNPX4zzAMpGVWN4cQDGWyosvV6LTnN0/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #910 - That Feeling of Losing Technical Knowledge - Google Docs
Match found in the HTML content.
Transcript content saved to That Feeling of Losing Technical Knowledge
title =  Virtualizing Kubernetes Clusters
link =  https://www.thecloudcast.net/2025/03/virtualizing-kubernetes-clusters.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Virtualizing Kubernetes Clusters
Transcript URL: https://youtube.com/@TheCloudcastNET
transcript_link =  https://youtube.com/@TheCloudcastNET


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast - YouTube
Match found in the HTML content.
Transcript content saved to Virtualizing Kubernetes Clusters
title =  Are Acquisitions Making a Comeback?
link =  https://www.thecloudcast.net/2025/03/are-acquisitions-making-comeback.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Are Acquisitions Making a Comeback?
Transcript URL: https://docs.google.com/document/d/1oezDXwxvf3x7MNgCGboeAO6js0dknkV1tGtLGtx6eAk/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/1oezDXwxvf3x7MNgCGboeAO6js0dknkV1tGtLGtx6eAk/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #908 - Are Acquisitions Making a Comeback? - Google Docs
Match found in the HTML content.
Transcript content saved to Are Acquisitions Making a Comeback?
title =  Migrating from Infrastructure as Code
link =  https://www.thecloudcast.net/2025/03/migrating-from-infrastructure-as-code.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Migrating from Infrastructure as Code
Transcript URL: https://docs.google.com/document/d/1a3ydUCI4wwJ_f2Jr3JCU3rDGe1oogwzytGKh_45kFiE/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/1a3ydUCI4wwJ_f2Jr3JCU3rDGe1oogwzytGKh_45kFiE/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #911 - AI & Cloud Trends for March - Google Docs
Match found in the HTML content.
Transcript content saved to Migrating from Infrastructure as Code
title =  Decoding Corporate Communications
link =  https://www.thecloudcast.net/2025/03/decoding-corporate-communications.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Decoding Corporate Communications
Transcript URL: https://docs.google.com/document/d/1qcEEiw0iNV2nKxVObQW4yZ-RaOQEDPMeq1ZoQi93Rck/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/1qcEEiw0iNV2nKxVObQW4yZ-RaOQEDPMeq1ZoQi93Rck/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #906 - Decoding Corporate Communications - Google Docs
Match found in the HTML content.
Transcript content saved to Decoding Corporate Communications
title =  AI Impacts Across Organizations & Startups
link =  https://www.thecloudcast.net/2025/03/ai-impacts-across-organizations-startups.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: AI Impacts Across Organizations & Startups
Transcript URL: https://docs.google.com/document/d/1pN5ASdgkfU9GVona-grgdcxcPPfSHd5vGCVD7EmwaUQ/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/1pN5ASdgkfU9GVona-grgdcxcPPfSHd5vGCVD7EmwaUQ/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #905 - AI Impacts Across Organizations & Startups - Google Docs
Match found in the HTML content.
Transcript content saved to AI Impacts Across Organizations & Startups
title =  Five Things I Did This Week
link =  https://www.thecloudcast.net/2025/03/five-things-i-did-this-week.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Five Things I Did This Week
Transcript URL: https://docs.google.com/document/d/1ZDwh8yKoZqsnFkeuVHi_QkR7YZASA1E4kRcLoKRBSmE/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/1ZDwh8yKoZqsnFkeuVHi_QkR7YZASA1E4kRcLoKRBSmE/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #904 - 5 Things I Did This Week - Google Docs
Match found in the HTML content.
Transcript content saved to Five Things I Did This Week
title =  Cloud & AI News Trends for February 2025
link =  https://www.thecloudcast.net/2025/03/cloud-ai-news-trends-for-february-2025.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Cloud & AI News Trends for February 2025
Transcript tag not found.
transcript_link =  None
title =  Bathing in the Confusion around GenAI
link =  https://www.thecloudcast.net/2025/03/bathing-in-confusion-around-genai.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Bathing in the Confusion around GenAI
Transcript URL: https://docs.google.com/document/d/1StsmMw28qldpGVbWycPy_AOb8bZ72SS7Z2koi4VJgvY/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/1StsmMw28qldpGVbWycPy_AOb8bZ72SS7Z2koi4VJgvY/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #902 - Bathing in the Confusion around GenAI - Google Docs
Match found in the HTML content.
Transcript content saved to Bathing in the Confusion around GenAI
title =  Developer Assitance with Coding Co-Pilots
link =  https://www.thecloudcast.net/2025/02/coding-co-pilots.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Developer Assitance with Coding Co-Pilots
Transcript tag not found.
transcript_link =  None
title =  What is your industry's DeepSeek moment?
link =  https://www.thecloudcast.net/2025/02/what-is-your-industrys-deepseek-moment.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: What is your industry's DeepSeek moment?
Transcript URL: https://docs.google.com/document/d/11if-lysqH23-iRtGyx2jZW17R433vdoe58pLPi1SgR4/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/11if-lysqH23-iRtGyx2jZW17R433vdoe58pLPi1SgR4/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #900 - What is your industry's Deepseek moment? - Google Docs
Match found in the HTML content.
Transcript content saved to What is your industry's DeepSeek moment?
title =  VMware Migrations
link =  https://www.thecloudcast.net/2025/02/vmware-migrations.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: VMware Migrations
Transcript tag not found.
transcript_link =  None
title =  How will AI impact your IT budget?
link =  https://www.thecloudcast.net/2025/02/how-will-ai-impact-your-it-budget.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: How will AI impact your IT budget?
Transcript URL: https://docs.google.com/document/d/16JBDoLwQ_hwuExN9SUcel76dKhqoUPyUCp8AqsGketI/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/16JBDoLwQ_hwuExN9SUcel76dKhqoUPyUCp8AqsGketI/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #898 - How wil AI impact your IT budget? - Google Docs
Match found in the HTML content.
Transcript content saved to How will AI impact your IT budget?
title =  The Path to Tech Executive Roles
link =  https://www.thecloudcast.net/2025/02/the-path-to-tech-executive.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: The Path to Tech Executive Roles
Transcript tag not found.
transcript_link =  None
title =  Welcome to the Bi-Modal Cloud Era
link =  https://www.thecloudcast.net/2025/02/welcome-to-bi-modal-cloud-era.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Welcome to the Bi-Modal Cloud Era
Transcript URL: https://docs.google.com/document/d/15D3SiWUYuPMyqsochx3I91ZPruyo0zFQdM260iVzB0E/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/15D3SiWUYuPMyqsochx3I91ZPruyo0zFQdM260iVzB0E/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #896 - Welcome to the Bi-Modal Cloud Era - Google Docs
Match found in the HTML content.
Transcript content saved to Welcome to the Bi-Modal Cloud Era
title =  Cloud & AI News of the Month - January 2025
link =  https://www.thecloudcast.net/2025/02/the-cloudcast-895-cloud-news-of-month.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Cloud & AI News of the Month - January 2025
Transcript tag not found.
transcript_link =  None
title =  Shut up and write code!
link =  https://www.thecloudcast.net/2025/02/shut-up-and-write-code.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Shut up and write code!
Transcript URL: https://docs.google.com/document/d/1a3zLITAZMdIhMUNWDu7xr-EKc8aYSJ5OY-q2Z0oOkZs/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/1a3zLITAZMdIhMUNWDu7xr-EKc8aYSJ5OY-q2Z0oOkZs/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #894 - Shut up and write code! - Google Docs
Match found in the HTML content.
Transcript content saved to Shut up and write code!
title =  Modernizing Video Production with AI
link =  https://www.thecloudcast.net/2025/01/modernizing-video-production-with-ai.html


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: The Cloudcast: Modernizing Video Production with AI
Transcript URL: https://docs.google.com/document/d/1N5QKXcJclRCwKPKW4sProy67Xxby2_euKaoEbT8nS4A/edit?usp=sharing
transcript_link =  https://docs.google.com/document/d/1N5QKXcJclRCwKPKW4sProy67Xxby2_euKaoEbT8nS4A/edit?usp=sharing


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


browser =  <Browser type=<BrowserType name=chromium executable_path=/Users/mahadevgaonkar/Library/Caches/ms-playwright/chromium-1161/chrome-mac/Chromium.app/Contents/MacOS/Chromium> version=134.0.6998.35>
page =  <Page url='about:blank'>
page title: [TRANSCRIPT] The Cloudcast #893 - Modernizing Video Production with AI - Google Docs
Match found in the HTML content.
Transcript content saved to Modernizing Video Production with AI
