In [1]:
from langchain_community.document_loaders.text import TextLoader

# Build a loader for the local text file "story.txt", decoded as UTF-8.
# NOTE(review): despite its name, `story` is the loader object, not the text.
story = TextLoader("story.txt", encoding="utf-8")

# Last expression of the cell, so the notebook displays what load() returns
# (the recorded output is a list holding one Document for story.txt).
story.load()

[Document(metadata={'source': 'story.txt'}, page_content='The Whispering Grove\n\nIn the heart of the Elderwood Forest, where ancient oaks stretched their gnarled branches toward the starlit sky, young Lyra discovered a grove that shimmered with an otherworldly light. The trees here were different—their bark gleamed like silver, and their leaves sang soft melodies when touched by the evening breeze.\n\nAs she stepped into the clearing, the ground beneath her feet began to glow with ethereal runes, pulsing in rhythm with her heartbeat. At the center of the grove stood a crystalline fountain, its waters flowing upward in defiance of nature\'s laws, forming spiraling ribbons of liquid starlight.\n\n"Welcome, child of two worlds," whispered a voice that seemed to come from the very air itself.\n\nLyra turned to see a figure emerging from behind the largest tree—an elf with eyes like captured moonbeams and hair that flowed like liquid silver. She wore robes woven from spider silk and mornin

In [2]:
# Install required packages for PDF generation
import subprocess
import sys

def install_package(package):
    """Install ``package`` with pip into the running interpreter's environment.

    pip is invoked as ``<sys.executable> -m pip install <package>`` so the
    package lands in the same environment the notebook kernel is using.
    After a successful install the import system's finder caches are
    invalidated, so the package can be imported immediately in this process.

    Args:
        package: Requirement string passed verbatim to ``pip install``.

    Raises:
        subprocess.CalledProcessError: If pip exits with a non-zero status.
    """
    # Function-scope import keeps this helper self-contained.
    import importlib

    subprocess.check_call([sys.executable, "-m", "pip", "install", package])
    # Modules created after interpreter start-up may not be noticed by the
    # import system until its caches are invalidated.
    importlib.invalidate_caches()

# Import the ReportLab names used for PDF generation. If any of these imports
# raises ImportError, install reportlab with pip and retry the same imports.
# NOTE(review): `canvas` is imported here but not referenced in the visible cells.
try:
    from reportlab.pdfgen import canvas
    from reportlab.lib.pagesizes import letter
    from reportlab.lib.styles import getSampleStyleSheet
    from reportlab.platypus import SimpleDocTemplate, Paragraph, Spacer
except ImportError:
    # Fallback path: install into the environment of the running interpreter
    # (install_package calls pip through sys.executable), then import again.
    print("Installing reportlab...")
    install_package("reportlab")
    # A second ImportError here is not caught and will surface to the user.
    from reportlab.pdfgen import canvas
    from reportlab.lib.pagesizes import letter
    from reportlab.lib.styles import getSampleStyleSheet
    from reportlab.platypus import SimpleDocTemplate, Paragraph, Spacer

# Reached only when the imports above succeeded on the first or second attempt.
print("PDF generation libraries ready!")

Installing reportlab...
Collecting reportlab
  Downloading reportlab-4.4.2-py3-none-any.whl.metadata (1.8 kB)
Collecting pillow>=9.0.0 (from reportlab)
  Downloading pillow-11.3.0-cp313-cp313-macosx_11_0_arm64.whl.metadata (9.0 kB)
Downloading reportlab-4.4.2-py3-none-any.whl (2.0 MB)
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m2.0/2.0 MB[0m [31m9.6 MB/s[0m eta [36m0:00:00[0ma [36m0:00:01[0m
[?25hDownloading pillow-11.3.0-cp313-cp313-macosx_11_0_arm64.whl (4.7 MB)
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m4.7/4.7 MB[0m [31m19.8 MB/s[0m eta [36m0:00:00[0ma [36m0:00:01[0m
[?25hInstalling collected packages: pillow, reportlab
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m2/2[0m [reportlab]/2[0m [reportlab]
[1A[2KSuccessfully installed pillow-11.3.0 reportlab-4.4.2
PDF generation libraries ready!


In [3]:
# Latest GenAI Models Data (as of July 2025)
#
# Mapping of model name -> details dict. Every entry uses the same four keys:
#   "owner"        - organisation behind the model (str)
#   "description"  - short free-text summary (str)
#   "release_date" - "<Month> <Year>" display string (str, not a date object)
#   "capabilities" - list of short capability labels (list of str)
# The values are hand-written text; nothing here is fetched or validated.
genai_models = {
    "GPT-4o": {
        "owner": "OpenAI",
        "description": "Advanced multimodal AI model capable of processing text, images, and audio with superior reasoning capabilities. Features improved efficiency and reduced costs compared to GPT-4.",
        "release_date": "May 2024",
        "capabilities": ["Text generation", "Image understanding", "Audio processing", "Code generation", "Mathematical reasoning"]
    },
    "Claude 3.5 Sonnet": {
        "owner": "Anthropic",
        "description": "Anthropic's most capable model with enhanced reasoning, coding abilities, and improved safety features. Excels at complex analysis and creative tasks.",
        "release_date": "June 2024", 
        "capabilities": ["Advanced reasoning", "Code generation", "Creative writing", "Analysis", "Safety-focused responses"]
    },
    "Gemini Ultra": {
        "owner": "Google",
        "description": "Google's most advanced AI model with multimodal capabilities, excelling in complex reasoning tasks and integration with Google services.",
        "release_date": "February 2024",
        "capabilities": ["Multimodal processing", "Complex reasoning", "Google integration", "Real-time information", "Code understanding"]
    },
    "LLaMA 3": {
        "owner": "Meta",
        "description": "Open-source large language model with strong performance across various tasks. Available in multiple sizes with improved efficiency.",
        "release_date": "April 2024",
        "capabilities": ["Open source", "Multilingual", "Code generation", "Reasoning", "Customizable fine-tuning"]
    },
    "o1-preview": {
        "owner": "OpenAI",
        "description": "OpenAI's reasoning-focused model designed for complex problem-solving, mathematics, and scientific research with extended thinking time.",
        "release_date": "September 2024",
        "capabilities": ["Advanced reasoning", "Mathematics", "Scientific analysis", "Complex problem solving", "Chain-of-thought processing"]
    },
    "Mistral Large": {
        "owner": "Mistral AI",
        "description": "European AI company's flagship model with strong multilingual capabilities and focus on efficiency and safety.",
        "release_date": "February 2024",
        "capabilities": ["Multilingual", "Efficient processing", "Code generation", "Safety features", "European data compliance"]
    }
}

# Quick sanity check that the literal above parsed with the expected entry count.
print(f"Loaded information for {len(genai_models)} GenAI models")

Loaded information for 6 GenAI models


In [4]:
# Generate PDF with GenAI Models Information
from datetime import datetime

def create_genai_models_pdf(filename="latest_genai_models_2025.pdf", models=None):
    """Write the GenAI model overview to a PDF file and return the file name.

    The report consists of a title, a dated subtitle, an introduction, one
    section per model (owner, release date, description, key capabilities)
    and a closing note. A confirmation line is printed once the file is built.

    Args:
        filename: Path of the PDF to write. Defaults to the name the notebook
            originally hard-coded, so a call with no arguments behaves as before.
        models: Mapping of model name -> dict with the keys ``owner``,
            ``release_date``, ``description`` and ``capabilities`` (an iterable
            of strings). Defaults to the notebook-level ``genai_models``.

    Returns:
        The ``filename`` that was written.

    Raises:
        KeyError: If a model entry lacks one of the four expected keys.
    """
    # Function-scope import keeps the block self-contained.
    from xml.sax.saxutils import escape

    if models is None:
        models = genai_models

    doc = SimpleDocTemplate(filename, pagesize=letter)
    styles = getSampleStyleSheet()
    heading_style = styles['Heading2']
    body_style = styles['Normal']

    # Flowables are collected in order; named `flowables` rather than `story`
    # so it cannot be confused with the notebook-level `story` loader.
    flowables = []

    def _add(markup, style, space_after):
        """Append one paragraph followed by vertical space of `space_after`."""
        flowables.append(Paragraph(markup, style))
        flowables.append(Spacer(1, space_after))

    # Title
    _add("Latest Generative AI Models - 2025", styles['Title'], 12)

    # Subtitle
    # NOTE(review): this is stamped with the current month while the closing
    # note hard-codes "July 2025"; left unchanged, confirm which is intended.
    _add(
        f"Comprehensive Overview - Updated {datetime.now().strftime('%B %Y')}",
        heading_style,
        24,
    )

    # Introduction
    intro_text = """
    This document provides an overview of the latest and most significant generative AI models 
    as of 2025. Each model represents cutting-edge advancements in artificial intelligence, 
    offering unique capabilities and applications across various domains.
    """
    _add(intro_text, body_style, 20)

    # Model details. Paragraph text is interpreted as inline markup (the <b>
    # and <i> tags used here rely on that), so data values are XML-escaped to
    # keep characters such as '&' or '<' from being parsed as markup.
    for model_name, details in models.items():
        _add(f"<b>{escape(str(model_name))}</b>", heading_style, 6)

        fields = (
            ("Owner", details['owner']),
            ("Release Date", details['release_date']),
            ("Description", details['description']),
            ("Key Capabilities", ', '.join(details['capabilities'])),
        )
        last_index = len(fields) - 1
        for index, (label, value) in enumerate(fields):
            # A larger gap after the final field separates consecutive models.
            gap = 18 if index == last_index else 6
            _add(f"<b>{label}:</b> {escape(str(value))}", body_style, gap)

    # Footer
    footer_text = """
    <i>Note: This information is current as of July 2025. The AI landscape evolves rapidly, 
    and new models and updates are released frequently. For the most current information, 
    please consult the respective companies' official documentation.</i>
    """
    flowables.append(Spacer(1, 20))
    flowables.append(Paragraph(footer_text, body_style))

    # Build PDF
    doc.build(flowables)
    print(f"PDF created successfully: {filename}")
    return filename

# Create the PDF. The function prints its own confirmation line and returns
# the name of the file it wrote, which is stored in `pdf_filename`.
pdf_filename = create_genai_models_pdf()
print(f"Generated PDF file: {pdf_filename}")

PDF created successfully: latest_genai_models_2025.pdf
Generated PDF file: latest_genai_models_2025.pdf


In [20]:

from langchain_community.document_loaders import PyPDFLoader
# NOTE(review): this re-assigns `pdf_filename` with the same literal name that
# create_genai_models_pdf() writes to; the file must already exist on disk.
pdf_filename = "latest_genai_models_2025.pdf"
# `pdf_data` is the loader object; the documents come from load() below.
pdf_data = PyPDFLoader(pdf_filename)
# Last expression of the cell: the notebook displays the loaded Document list
# (the recorded output shows per-page metadata such as 'page' and 'total_pages').
pdf_data.load()



[Document(metadata={'producer': 'ReportLab PDF Library - www.reportlab.com', 'creator': '(unspecified)', 'creationdate': '2025-07-16T17:26:44+05:00', 'author': '(anonymous)', 'keywords': '', 'moddate': '2025-07-16T17:26:44+05:00', 'subject': '(unspecified)', 'title': '(anonymous)', 'trapped': '/False', 'source': 'latest_genai_models_2025.pdf', 'total_pages': 2, 'page': 0, 'page_label': '1'}, page_content="Latest Generative AI Models - 2025\nComprehensive Overview - Updated July 2025\nThis document provides an overview of the latest and most significant generative AI models as of 2025.\nEach model represents cutting-edge advancements in artificial intelligence, offering unique capabilities\nand applications across various domains.\nGPT-4o\nOwner: OpenAI\nRelease Date: May 2024\nDescription: Advanced multimodal AI model capable of processing text, images, and audio with\nsuperior reasoning capabilities. Features improved efficiency and reduced costs compared to GPT-4.\nKey Capabilities: 

In [24]:
from langchain_community.document_loaders import WebBaseLoader
# Page to load; load() is expected to fetch it, so this cell presumably needs network access.
url = "https://cloudenginelabs.io"
# `web_data` is the loader object; the documents come from load() below.
web_data = WebBaseLoader(url)
# Last expression of the cell: the notebook displays the loaded Document list
# (the recorded output carries 'source', 'title', 'description' and 'language' metadata).
web_data.load()

[Document(metadata={'source': 'https://cloudenginelabs.io', 'title': 'CloudEngine Labs', 'description': 'Cloud & DevOps Automation, Technical Content, and Software Development services.', 'language': 'en'}, page_content='CloudEngine LabsCloudEngine Labs IconCloudEngine Labs®ServicesProductsTestimonialsTrainingContactToggle themeBuild, Automate, and Scale Applications with CloudEngine Labs®Your expert partner for Cloud & DevOps automation, Technical content creation, & Bespoke software development.Our ServicesOur ProductsTake Quick Automation AssessmentContact UsWhat We OfferExpert services designed to accelerate your innovation and growth.Cloud & DevOps AutomationCI/CD Pipeline ImplementationInfrastructure as Code (IaC)Cloud Migration & ManagementContainerization & OrchestrationTechnical Content CreationEngaging Blog Posts & ArticlesIn-depth WhitepapersClear & Concise DocumentationVideo Tutorials & DemosSoftware DevelopmentCustom Web ApplicationsAPI Development & IntegrationCloud-Nativ