In [10]:
import pandas as pd 
import os
from pathlib import Path
from dotenv import load_dotenv

#Local
from config import Config
from data_processing import data_processing
from utils import remove_dirs, check_and_create_dirs
from question_generator import question_generator

# Display settings: do not truncate column text, so long generated questions
# and answers are shown in full when DataFrames are displayed.
pd.set_option('display.max_colwidth', None)

# Configuration: the Perplexity API key is read from the environment
# (populated from a local .env file by load_dotenv), not written in the notebook.
load_dotenv()
api_key = os.getenv("PERPLEXITY_API_KEY")
if not api_key:
    # os.getenv returns None when the variable is unset; stop here with a clear
    # message instead of passing a missing key on to the cells below.
    raise RuntimeError(
        "PERPLEXITY_API_KEY is not set. Add it to your .env file or environment "
        "before running this notebook."
    )

cfg = Config(
    project_name="session_1",
    input_dir="data",
    api_key=api_key,
    n_questions_per_file=1,
    n_page_summary=3,
    chunk_size=5000,
    chunk_overlap=500
)

# remove_dirs(cfg) # This will delete the output directories if they exist
check_and_create_dirs(cfg)


Folder 'session_1' and 'session_1\chunks' has been created.


In [11]:
# Process the input files configured in cfg. Per the printed log, each file's
# chunks are saved as JSON under the project's chunks folder and a shared
# metadata.json is rewritten after every file.
data_processing(api_key, cfg)

Processing file: 2024-amazon-annual-report-10K.pdf 1/10
Saving chunks to session_1\chunks\2024-amazon-annual-report-10K.json
Saving metadata to session_1\metadata.json
Processing file: 2024-apple-annual-report-10K.pdf 2/10
Saving chunks to session_1\chunks\2024-apple-annual-report-10K.json
Saving metadata to session_1\metadata.json
Processing file: 2024-cisco-full-annual-report.pdf 3/10
Saving chunks to session_1\chunks\2024-cisco-full-annual-report.json
Saving metadata to session_1\metadata.json
Processing file: 2024-google-annual-report-10K.pdf 4/10
Saving chunks to session_1\chunks\2024-google-annual-report-10K.json
Saving metadata to session_1\metadata.json
Processing file: 2024-meta-full-annual-report.pdf 5/10
Saving chunks to session_1\chunks\2024-meta-full-annual-report.json
Saving metadata to session_1\metadata.json
Processing file: 2024-netflix-annual-report-10K.pdf 6/10
Saving chunks to session_1\chunks\2024-netflix-annual-report-10K.json
Saving metadata to session_1\metadata

In [12]:
# Generate questions for each processed file; the printed log reports that the
# questions are also saved to the project's questions.csv.
# The returned frame is kept in df for inspection in the next cell.
df = question_generator(cfg)

Generating 1 question for file: 2024-amazon-annual-report-10K.pdf. 1/10
Generating 1 question for file: 2024-apple-annual-report-10K.pdf. 2/10
Generating 1 question for file: 2024-cisco-full-annual-report.pdf. 3/10
Generating 1 question for file: 2024-google-annual-report-10K.pdf. 4/10
Generating 1 question for file: 2024-meta-full-annual-report.pdf. 5/10
Generating 1 question for file: 2024-netflix-annual-report-10K.pdf. 6/10
Generating 1 question for file: 2024-nvidia-annual-report-10K.pdf. 7/10
Generating 1 question for file: 2024-oracle-annual-report-10K.pdf. 8/10
Generating 1 question for file: 2024-reddit-annual-report-10K.pdf. 9/10
Generating 1 question for file: 2024-tsla-annual-report-10K.pdf. 10/10
Questions saved to session_1\questions.csv


In [13]:
# Preview the first generated questions (display.max_colwidth is None, so the
# full text is shown).
# NOTE(review): the question at index 2 in the output starts with LLM boilerplate
# ("Based on the provided chunk ...") instead of a clean question — presumably
# question_generator should strip such preambles; confirm.
df['question'].head()

0                                                                                                                                                                                                             What types of financial statements are included in Amazon's 2024 financial report, as outlined in the document's index to consolidated financial statements?
1                                                                                                                                                                       What forward-looking statements are included in Apple Inc.'s Form 10-K for the fiscal year ended September 28, 2024, and how do they relate to potential future impacts on the company's business?
2    Based on the provided chunk regarding Cisco Systems’ fiscal year 2024 report, here is a question generated according to your requirements:\n\n**How did Cisco Systems’ management and principal officers assess the effectiveness of the company’s disclosure controls and pr

## MODEL 1

In [14]:
from user_models.example_1.model import run_qa_pipeline
from user_models.createplot import plot
from user_models.example_1.qa import create_chain
from user_models.evaluate import evaluate_answer

In [15]:
# Model 1 Configuration (FAISS + HuggingFace embeddings, standard retriever)
MODEL_1_CONFIG = {
    "model_name": "model_1",
    "model_type": "faiss",

    # Data paths
    "pdf_folder": "./data",
    "vector_store_path": "faiss_index_open",
    "questions_file": "session_1/questions.csv",
    "log_file": "qa_log_1.csv",
    "final_output_file": "final_1.csv",

    # Text processing
    "chunk_size": 5000,
    "chunk_overlap": 500,
    "text_splitter_type": "recursive",  # "recursive" or "token"
    "document_loader": "pymupdf",  # "pymupdf" or "pypdf"

    # Embeddings
    "embedding_model": "sentence-transformers/all-mpnet-base-v2",
    "embedding_type": "huggingface",
    "embedding_device": "cpu",
    "normalize_embeddings": False,

    # LLM settings
    "llm_model": "sonar",
    # Secrets must never be committed to a notebook: read the key from the
    # environment (the same PERPLEXITY_API_KEY variable the setup cell loads).
    # Any key that was previously hard-coded here should be treated as
    # compromised and rotated.
    "pplx_api_key": os.getenv("PERPLEXITY_API_KEY"),
    "temperature": 0.2,

    # Retrieval settings
    "retriever_k": 3,
    "use_compression": False,
    "use_custom_prompt": False,

    # Processing settings
    "recreate_vector_store": False,
    "max_retries": 3
}

# Model 2 Configuration (Chroma + BGE Embeddings + Compression)
MODEL_2_CONFIG = {
    "model_name": "model_2",
    "model_type": "chroma",

    # Data paths
    "pdf_folder": "./data",
    "vector_store_path": "chroma_index_finance",
    "questions_file": "session_1/questions.csv",
    "log_file": "qa_log_2.csv",
    "final_output_file": "final_2.csv",

    # Text processing
    # NOTE(review): with the "token" splitter these sizes are presumably counted
    # in tokens rather than characters — confirm they suit the embedding model.
    "chunk_size": 5000,
    "chunk_overlap": 500,
    "text_splitter_type": "token",
    "document_loader": "pypdf",

    # Embeddings
    "embedding_model": "BAAI/bge-base-en",
    "embedding_type": "bge",
    "embedding_device": "cpu",
    "normalize_embeddings": True,

    # LLM settings
    "llm_model": "sonar",
    # Secrets must never be committed to a notebook: read the key from the
    # environment (the same PERPLEXITY_API_KEY variable the setup cell loads).
    # Any key that was previously hard-coded here should be treated as
    # compromised and rotated.
    "pplx_api_key": os.getenv("PERPLEXITY_API_KEY"),
    "temperature": 0.2,

    # Retrieval settings
    "retriever_k": 5,
    "use_compression": True,
    "use_custom_prompt": True,
    # Prompt template; {context} and {question} are placeholders left for the
    # QA chain to fill in.
    "custom_prompt": """
    You are a professional financial advisor with expertise in corporate finance, investment analysis, and career development in finance-related roles.

    Use only the information provided in the context to answer the user's question.
    Do not make assumptions or fabricate any details.

    Respond clearly and professionally, as if advising a client on their financial career or investment decisions.

    {context}

    Question: {question}

    If the answer is not explicitly stated in the context, respond with: "I don't know based on the provided document".
    """,

    # Processing settings
    "recreate_vector_store": False,
    "max_retries": 3
}

In [16]:
from user_models.qa import create_unified_chain
from user_models.model import run_qa_pipeline
from user_models.evaluate import evaluate_answer
from user_models.createplot import plot

def run_model_experiment(config, experiment_name=""):
    """Build a QA chain from ``config``, run the QA pipeline, and plot the results.

    Args:
        config: Dict of model settings. The whole dict is handed to
            ``create_unified_chain``; this function itself reads the keys
            "model_name", "questions_file", "log_file", "final_output_file"
            and "max_retries".
        experiment_name: Optional label for the printed banner. When empty,
            ``config["model_name"]` is used instead.

    Returns:
        The ``(df, final_df)`` pair returned by ``run_qa_pipeline``.
    """
    # Banner announcing which experiment is starting.
    rule = "=" * 50
    print(f"\n{rule}")
    title = experiment_name if experiment_name else config['model_name']
    print(f"Running {title} Experiment")
    print(rule)

    # Build the chain first, then collect the pipeline arguments from config.
    chain = create_unified_chain(config)
    pipeline_args = {
        "qa_chain": chain,
        "questions_file": config["questions_file"],
        "log_file": config["log_file"],
        "final_output_file": config["final_output_file"],
        "evaluate_answer_func": evaluate_answer,
        "max_retries": config["max_retries"],
    }
    answers, evaluated = run_qa_pipeline(**pipeline_args)

    # Plotting is best-effort: a failure is reported but does not discard
    # the pipeline results.
    try:
        plot(evaluated)
        print(f"Plots created successfully for {config['model_name']}")
    except Exception as plot_error:
        print(f"Error creating plots for {config['model_name']}: {plot_error}")

    return answers, evaluated

In [23]:
# Model 1: FAISS vector store with HuggingFace embeddings
df1, final_df1 = run_model_experiment(
    config=MODEL_1_CONFIG,
    experiment_name="Model 1 (FAISS)",
)

# Model 2: Chroma vector store with BGE embeddings and a compression retriever
df2, final_df2 = run_model_experiment(
    config=MODEL_2_CONFIG,
    experiment_name="Model 2 (Chroma)",
)


Running Model 1 (FAISS) Experiment
Loading existing vector store for model_1...
Vector store loaded from: faiss_index_open
Using standard retriever
QA chain created successfully for model_1
=== Starting QA Pipeline ===
Cleared existing log file: qa_log_1.csv
Processing 10 questions from session_1/questions.csv
Processing question 1/10: What types of financial statements are included in...
Processing question 2/10: What forward-looking statements are included in Ap...
Processing question 3/10: Based on the provided chunk regarding Cisco System...
Processing question 4/10: How do evolving and uncertain regulations in areas...
Processing question 5/10: How does Meta Platforms, Inc. address the limitati...
Processing question 6/10: What exhibits related to Netflix, Inc.’s fiscal ye...
Processing question 7/10: How have new US export control restrictions in 202...
Processing question 8/10: What were the key components and figures of Oracle...
Processing question 9/10: What risks does Reddi

Plots created successfully for model_1

Running Model 2 (Chroma) Experiment
Loading existing vector store for model_2...



The class `Chroma` was deprecated in LangChain 0.2.9 and will be removed in 1.0. An updated version of the class exists in the :class:`~langchain-chroma package and should be used instead. To use it run `pip install -U :class:`~langchain-chroma` and import as `from :class:`~langchain_chroma import Chroma``.



Vector store loaded from: chroma_index_finance
Using compression retriever
Using custom prompt template
QA chain created successfully for model_2
=== Starting QA Pipeline ===
Cleared existing log file: qa_log_2.csv
Processing 10 questions from session_1/questions.csv
Processing question 1/10: What types of financial statements are included in...
Processing question 2/10: What forward-looking statements are included in Ap...
Processing question 3/10: Based on the provided chunk regarding Cisco System...
Processing question 4/10: How do evolving and uncertain regulations in areas...
Processing question 5/10: How does Meta Platforms, Inc. address the limitati...
Processing question 6/10: What exhibits related to Netflix, Inc.’s fiscal ye...
Processing question 7/10: How have new US export control restrictions in 202...
Processing question 8/10: What were the key components and figures of Oracle...
Processing question 9/10: What risks does Reddit, Inc. identify in its 2024 ...
Processing q

Plots created successfully for model_2


In [21]:
# Show the evaluated answers for Model 1 (at most 10 rows).
# NOTE(review): row 0 has evaluation_error "Expecting value: line 1 column 1
# (char 0)" and empty scores — looks like the evaluator's reply could not be
# parsed as JSON; confirm in evaluate_answer.
final_df1.head(10)

Unnamed: 0,question,top_k_chunk,answer,evaluation_error,evaluation_factual_correctness_score,evaluation_completeness_score,evaluation_clarity_score,evaluation_comments
0,"What types of financial statements are included in Amazon's 2024 financial report, as outlined in the document's index to consolidated financial statements?",13; 62; 107,"Amazon's 2024 financial report includes the following types of financial statements as outlined in the index to consolidated financial statements:\n\n- **Consolidated Statements of Cash Flows**: These statements detail the inflows and outflows of cash and cash equivalents over the three years ended December 31, 2024.\n- **Consolidated Statements of Operations**: These statements provide a detailed breakdown of Amazon's revenues and expenses for each of the three years ended December 31, 2024.\n- **Consolidated Statements of Comprehensive Income (Loss)**: These statements include net income and other comprehensive income items such as foreign currency translation adjustments and unrealized gains or losses on available-for-sale debt securities for each of the three years ended December 31, 2024.\n- **Consolidated Balance Sheets**: These statements present Amazon's financial position at the end of the years 2023 and 2024.\n- **Consolidated Statements of Stockholders’ Equity**: These statements show changes in stockholders' equity over the three years ended December 31, 2024.\n- **Notes to Consolidated Financial Statements**: These provide additional details and explanations for the financial statements.\n- **Report of Ernst & Young LLP, Independent Registered Public Accounting Firm**: This includes the auditor's opinion on the fairness and accuracy of the financial statements.",Expecting value: line 1 column 1 (char 0),,,,
1,"What forward-looking statements are included in Apple Inc.'s Form 10-K for the fiscal year ended September 28, 2024, and how do they relate to potential future impacts on the company's business?",120; 115; 114,"Apple Inc.'s Form 10-K for the fiscal year ended September 28, 2024, includes forward-looking statements primarily in **Part I, Item 1** under the heading “Business” and **Part II, Item 7** under the heading “Management’s Discussion and Analysis of Financial Condition and Results of Operations.” These statements involve risks and uncertainties and provide current expectations of future events based on certain assumptions. They include discussions about the potential future impact of macroeconomic conditions on the company's business and results of operations.\n\n### Key Forward-Looking Statements and Their Implications\n\n1. **Macroeconomic Conditions**: Statements regarding how global and regional economic conditions, such as slow growth, recession, inflation, and currency fluctuations, could affect consumer confidence and demand for Apple's products and services. These conditions can also impact suppliers, contract manufacturers, and other partners, potentially leading to financial instability and reduced liquidity[1][3].\n\n2. **Risk Factors**: The discussion in **Item 1A** highlights various risks that could impact Apple's business, including macroeconomic risks, industry risks, and operational challenges. These risks are forward-looking as they discuss potential future impacts on the company's performance and financial condition[1].\n\n3. **Future Performance**: Forward-looking statements caution that past financial performance should not be considered a reliable indicator of future results. 
This reflects the uncertainty and variability in future outcomes due to factors like economic conditions and market trends[1].\n\nThese forward-looking statements are not guarantees of future performance, and actual results may differ significantly due to various factors discussed in the report, particularly in the risk factors section. Apple assumes no obligation to revise or update these statements except as required by law[1].",,5.0,5.0,5.0,"The answer accurately identifies the sections with forward-looking statements, discusses their content and implications, and aligns fully with the referenced document chunk and relevant SEC filings[1][2][3]."
2,"Based on the provided chunk regarding Cisco Systems’ fiscal year 2024 report, here is a question generated according to your requirements:\n\n**How did Cisco Systems’ management and principal officers assess the effectiveness of the company’s disclosure controls and procedures for fiscal year 2024, and what was their conclusion regarding those controls?**",255; 347; 352,"Cisco Systems’ management, including the principal executive officer and principal financial officer, assessed the effectiveness of the company’s disclosure controls and procedures for fiscal year 2024 by conducting an evaluation based on the framework in Internal Control—Integrated Framework (2013) issued by the Committee of Sponsoring Organizations of the Treadway Commission (COSO). Their assessment included a review of the design and operating effectiveness of internal control over financial reporting, with the oversight of the Board of Directors.\n\nManagement concluded that Cisco’s internal control over financial reporting was effective as of July 27, 2024. This conclusion was reached after excluding the internal controls of Splunk Inc., which Cisco acquired during the year, in accordance with SEC guidance that permits exclusion of acquisitions from the assessment for up to one year from the date of acquisition. Splunk’s assets and revenues represented approximately 3% of Cisco’s consolidated totals for the year[5].\n\nThe independent registered public accounting firm, PricewaterhouseCoopers LLP, also audited Cisco’s internal control over financial reporting and concurred with management’s conclusion, issuing an unqualified opinion that Cisco maintained effective internal control over financial reporting as of July 27, 2024[5].",,5.0,5.0,5.0,"The answer accurately reflects the information from the provided document chunk, detailing the management's assessment process, the framework used (COSO 2013), the exclusion of Splunk Inc. 
in the evaluation per SEC guidance, and the conclusion that Cisco's internal control over financial reporting was effective as of July 27, 2024. It also correctly states PricewaterhouseCoopers LLP's concurring audit opinion. The response fully answers the question clearly and precisely."
3,"How do evolving and uncertain regulations in areas such as AI, competition, consumer protection, content moderation, data privacy, news, and sustainability impact Alphabet Inc.'s business operations and risks, particularly as reported for the fiscal year ended December 31, 2024?",806; 451; 469,"Evolving and uncertain regulations in areas such as AI, competition, consumer protection, content moderation, data privacy, news, and sustainability have significant impacts on Alphabet Inc.’s business operations and risk profile, as highlighted in its 2024 fiscal year reporting and recent regulatory developments.\n\n## Regulatory Impact on Business Operations\n\n**Compliance Costs and Operational Complexity**\n\nAlphabet faces a growing burden of compliance with a wide array of new and changing laws across multiple jurisdictions. These include regulations on data privacy (such as the EU’s Digital Services Act and AI Act), competition and antitrust (including ongoing probes by the U.S. Department of Justice and European regulators), consumer protection, content moderation, and sustainability. Compliance is costly and complex, especially as regulations often differ or conflict between regions, requiring Alphabet to adapt its operations and policies in each market[5]. The company notes that these costs are likely to increase as regulatory scrutiny intensifies and new laws are enacted.\n\n**Antitrust and Competition Risks**\n\nAlphabet is under heightened antitrust scrutiny, particularly regarding its AI-related activities. For example, the U.S. Justice Department is investigating Alphabet’s 2024 deal with AI startup Character.AI, focusing on whether the arrangement unfairly concentrates AI talent and technology and stifles competition. Regulators are concerned that such deals may limit access to cutting-edge AI tools and expertise for rivals, potentially harming innovation and market competition[1][4]. 
Similar investigations are ongoing in the EU and UK, where regulators are examining Alphabet’s investments, partnerships, and supply of AI-related hardware and software.\n\n**Data Privacy and Content Moderation**\n\nNew and evolving data privacy laws, such as the EU’s Digital Services Act and proposed U.S. legislation like the American Privacy Rights Act, impose strict requirements on how Alphabet collects, uses, and shares user data. Non-compliance can result in significant fines—up to 6% of global revenue in the EU—and reputational damage[4]. Content moderation regulations also require Alphabet to monitor and manage harmful or illegal content, which increases operational costs and exposes the company to liability if it fails to meet regulatory standards.\n\n**AI and Emerging Technologies**\n\nRegulators are increasingly focused on the responsible development and deployment of AI. Alphabet’s leadership in AI has attracted scrutiny from regulators worldwide, who are considering restrictions on the hardware, software, and systems used to develop advanced AI models. Such restrictions could increase costs, delay product launches, and reduce the number of new customers, negatively impacting Alphabet’s business and financial results[5]. The company also faces reputational risks if AI systems produce harmful or inaccurate content.\n\n**Sustainability and Environmental Regulations**\n\nAlphabet is subject to environmental, health, and safety regulations, including those related to sustainability. Compliance with these regulations can affect the company’s supply chain, manufacturing processes, and product offerings, and may require additional investments in sustainable practices.\n\n## Financial and Strategic Risks\n\n**Revenue and Margin Pressures**\n\nAlphabet’s core revenue comes from online advertising, which is sensitive to regulatory changes affecting data privacy, advertising practices, and content moderation. 
New regulations can limit the effectiveness of targeted advertising, reduce advertiser demand, and increase compliance costs, putting pressure on margins[2][5]. The shift to new advertising formats and devices, while offering growth opportunities, also tends to have lower margins than traditional desktop search.\n\n**Market and Operational Risks**\n\nAlphabet’s global operations expose it to risks from geopolitical tensions, trade restrictions, and foreign exchange fluctuations. Government actions, such as tariffs, export controls, and sanctions, can disrupt supply chains, delay shipments, and increase costs[5]. The company’s reliance on third-party suppliers and manufacturers further amplifies these risks.\n\n**Reputational and Legal Risks**\n\nViolations of laws or regulatory requirements can result in fines, criminal sanctions, business restrictions, and reputational harm. Alphabet acknowledges that even inadvertent violations by employees, contractors, or partners could have material adverse effects on its business[5].\n\n## Summary Table: Key Regulatory Risks and Impacts\n\n| Regulatory Area | Impact on Alphabet Inc. 
|\n|------------------------|-------------------------------------------------------------|\n| AI | Increased scrutiny, compliance costs, delayed product launches, reputational risks[1][5] |\n| Competition/Antitrust | Probes, potential restrictions on deals, higher compliance costs, risk of fines[1][4] |\n| Data Privacy | Stricter rules, higher compliance costs, risk of fines, reputational damage[4][5] |\n| Content Moderation | Increased monitoring costs, liability for harmful content[5] |\n| Consumer Protection | Compliance costs, restrictions on business practices[5] |\n| News | Regulatory oversight, content moderation requirements[5] |\n| Sustainability | Compliance costs, supply chain impacts, investment needs[5] |\n\n## Conclusion\n\nEvolving and uncertain regulations in AI, competition, consumer protection, content moderation, data privacy, news, and sustainability present significant operational, financial, and reputational risks for Alphabet Inc. The company faces rising compliance costs, increased regulatory scrutiny, and potential restrictions on its business activities, all of which could negatively impact its financial results and competitive position in the digital economy[5][1][4].",,5.0,5.0,5.0,"The answer aligns well with the document chunk, accurately describing the impact of evolving regulations on Alphabet Inc.'s operations and risks for fiscal year 2024, including compliance costs, antitrust scrutiny, data privacy, AI, sustainability, and financial risks, all supported by the referenced documents. The presentation is thorough, clearly structured, and covers all relevant regulatory areas mentioned in the question."
4,"How does Meta Platforms, Inc. address the limitations and risks associated with forward-looking statements and the use of non-GAAP financial measures in its financial results for the fourth quarter and full year 2024?",549; 552; 550,"Meta Platforms, Inc. addresses the limitations and risks associated with forward-looking statements and the use of non-GAAP financial measures in its financial results for the fourth quarter and full year 2024 through several explicit disclosures and methodological clarifications:\n\n## Forward-Looking Statements\n\n- Meta clearly identifies forward-looking statements by using terms such as ""believe,"" ""may,"" ""will,"" ""estimate,"" ""continue,"" ""anticipate,"" ""intend,"" and ""expect"" to signal predictions about future events or results[1].\n\n- These statements are subject to numerous assumptions, risks, and uncertainties that could cause actual outcomes to differ materially from those expressed or implied. Meta references detailed risk factors and limitations in its filings with the Securities and Exchange Commission (SEC), specifically in sections like ""Risk Factors,"" ""Limitations of Key Metrics and Other Data,"" and ""Management's Discussion and Analysis of Financial Condition and Results of Operations"" in its Annual Report on Form 10-K and Quarterly Report on Form 10-Q[1][2][4].\n\n- Meta emphasizes that forward-looking statements speak only as of the date they are made and disclaims any obligation to update or revise these statements in the future, including archived materials which are provided solely for reference[1].\n\n- During earnings calls, Meta reiterates that actual results may differ materially from forward-looking statements, reinforcing the caution investors should exercise[5].\n\n## Non-GAAP Financial Measures\n\n- Meta adjusts its non-GAAP financial measures to provide supplemental information that it believes helps investors better understand underlying business trends. 
For example, it adjusts revenue for foreign exchange effects by translating revenue using prior year's exchange rates to facilitate comparison with historical performance[3].\n\n- In calculating free cash flow, Meta subtracts both purchases of property and equipment and principal payments on finance leases, considering these collectively as the capital expenditures needed to support the business regardless of financing method. This approach aims to provide a clearer picture of the company's capital investment trends[3].\n\n- Meta explicitly states that non-GAAP measures are not intended to represent residual cash flow available for discretionary expenditures, clarifying their purpose and limitations[3].\n\n- The company provides reconciliations of GAAP to non-GAAP measures in its press releases and SEC filings to ensure transparency and allow investors to understand the adjustments made[3].\n\nIn summary, Meta Platforms, Inc. manages the risks and limitations of forward-looking statements by clearly labeling them, disclosing associated risks comprehensively in SEC filings, and disclaiming update obligations. For non-GAAP financial measures, Meta explains its adjustment methodologies, clarifies the intent and limitations of these metrics, and provides reconciliations to GAAP figures to maintain transparency and assist investor understanding[1][2][3][4][5].",,5.0,5.0,5.0,"The answer accurately reflects how Meta Platforms, Inc. addresses forward-looking statements and non-GAAP financial measures by citing specific disclosures, risk factors, disclaimers, and reconciliation practices found in the referenced documents. It comprehensively covers both topics with clear, well-organized explanations directly supported by the search results."
5,"What exhibits related to Netflix, Inc.’s fiscal year ended December 31, 2024, are included in the annual report, and what types of certifications and plans are filed with the SEC as part of this report?",659; 645; 555,"The annual report for Netflix, Inc.'s fiscal year ended December 31, 2024, includes several exhibits and certifications filed with the SEC. Here are some key components:\n\n## Exhibits Included in the Annual Report\n\n1. **Exhibit 10.5**: Amended and Restated Performance Bonus Plan.\n2. **Exhibit 10.6**: Form of Stock Option Agreement under the 2011 Stock Plan.\n3. **Exhibit 10.7**: Form of Stock Option Agreement under the 2020 Stock Plan.\n4. **Exhibit 10.8**: Form of Stock Option Agreement under the 2020 Stock Plan (Options Subject to Vesting).\n5. **Exhibit 10.9**: Netflix, Inc. 2020 Stock Plan Form of Restricted Stock Unit Award Agreement.\n6. **Exhibit 10.10**: Netflix, Inc. 2020 Stock Plan Form of Performance-Based Restricted Stock Unit Award Agreement.\n7. **Exhibit 10.11**: Netflix, Inc. Executive Officer Severance Plan.\n8. **Exhibit 19.1**: Netflix, Inc. Insider Trading Policy.\n9. **Exhibit 21.1**: List of Significant Subsidiaries.\n10. **Exhibit 23.1**: Consent of Ernst & Young LLP.\n11. **Exhibit 31.1, 31.2, 31.3**: Certifications of Co-Chief Executive Officers and Chief Financial Officer Pursuant to Section 302 of the Sarbanes-Oxley Act of 2002.\n12. **Exhibit 32.1**: Certifications of Co-Chief Executive Officers and Chief Financial Officer Pursuant to Section 906 of the Sarbanes-Oxley Act of 2002.\n13. **Exhibit 97.1**: Netflix, Inc. Clawback Policy.\n14. **Exhibit 101**: Financial statements formatted in Inline XBRL.\n15. 
**Exhibit 104**: Cover page from the Annual Report on Form 10-K, formatted in Inline XBRL.\n\n## Certifications and Plans\n\n- **Section 302 Certifications**: These are certifications by the Co-Chief Executive Officers and the Chief Financial Officer that the report complies with the requirements of the Securities Exchange Act of 1934 and fairly presents the financial condition and results of operations of Netflix, Inc. (Exhibits 31.1, 31.2, 31.3).\n- **Section 906 Certifications**: These are certifications by the Co-Chief Executive Officers and the Chief Financial Officer pursuant to Section 906 of the Sarbanes-Oxley Act of 2002, affirming that the report complies with the Securities Exchange Act of 1934 and fairly presents the financial condition and results of operations (Exhibit 32.1).\n- **Stock Plans and Agreements**: Various stock option agreements and restricted stock unit award agreements are included, which outline compensation plans for executives and employees.\n- **Clawback Policy**: This policy allows Netflix to recover certain compensation from executives under specific circumstances (Exhibit 97.1).\n- **Insider Trading Policy**: This policy governs the trading of Netflix securities by insiders to prevent insider trading violations (Exhibit 19.1).",,3.0,3.0,4.0,"The answer lists exhibits and certifications plausibly present in a major SEC filing, but since the document chunk (pages 659, 645, 555) is not detailed here, actual accuracy is indeterminable; completeness is partial as it makes assumptions not verifiable from the snippet; clarity is good, but structure assumes content not confirmed."
6,"How have new US export control restrictions in 2024 negatively impacted NVIDIA Corporation's competitive position compared to certain competitors, and what specific risks do these controls pose for its future business and results in the China market and beyond?",810; 811; 808,"The new US export control restrictions imposed in 2024 have significantly impacted NVIDIA Corporation’s competitive position, especially in the China market, and introduced several specific risks for its future business and financial results.\n\n## Negative Impact on Competitive Position\n\n- **Disadvantage Against Competitors:** NVIDIA is now at a competitive disadvantage compared to certain competitors whose products are not subject to the same export restrictions or who may more easily obtain licenses. This has led to lost sales and market share in China, a region where NVIDIA reported $17 billion in sales in 2024[5].\n- **Compliance and Licensing Burden:** The management of new licenses and compliance requirements is complex and time-consuming, making NVIDIA’s pre- and post-sale technical support efforts more cumbersome and less certain. This encourages customers in China to seek alternatives, including semiconductor suppliers from China, Europe, and Israel[5].\n- **Product and Market Exclusion:** The US government has imposed indefinite licensing requirements on NVIDIA’s H20 chip sales to China, and similar controls may be extended to other products. This has already resulted in a $5.5 billion write-down due to unsellable inventory and stranded sales[5].\n\n## Specific Risks Posed by Export Controls\n\n- **Loss of Market Access:** Further changes or expansions in export controls could exclude NVIDIA from all or part of the China market, as well as other impacted regions such as the Middle East. 
This could also affect markets in Europe, Latin America, and Southeast Asia if customers choose to “design-out” US semiconductors to reduce compliance risk[5].\n- **Supply Chain Disruption:** Export controls may disrupt NVIDIA’s supply and distribution chains, particularly for products warehoused in and distributed from Hong Kong. Restrictions on datacenter GPUs could also negatively impact demand for NVIDIA’s networking products used in servers[5].\n- **Product Development and Inventory Risks:** The possibility of new controls being imposed at any time increases the risk that new products may be subject to export restrictions before they reach the market, leading to excess inventory and stranded investments[5].\n- **Customer and End-User Restrictions:** Export controls may subject downstream users to additional restrictions on the use, resale, repair, or transfer of NVIDIA products, further complicating customer relationships and service obligations[5].\n- **Regulatory and Geopolitical Risks:** Increased scrutiny from regulators in China and other regions, as well as potential retaliatory measures, could result in penalties or restrictions on NVIDIA’s ability to conduct business. 
For example, Chinese regulators have already inquired about NVIDIA’s sales and fulfillment of commitments related to the Mellanox acquisition[5].\n- **Impact on Cloud and AI Services:** Controls could negatively impact NVIDIA’s ability to provide AI cloud services and affect the cost and availability of services for cloud providers and their end customers, even outside China[5].\n- **Investment and Innovation Risks:** The uncertainty created by shifting export controls may discourage investment in NVIDIA’s advanced semiconductor products and encourage investment in foreign competitors less likely to be restricted by US controls[5].\n\n## Summary Table: Key Risks and Impacts\n\n| Risk/Impact Area | Description |\n|----------------------------------|---------------------------------------------------------------------------------------------|\n| Competitive Disadvantage | Competitors not subject to controls gain market share; customers seek alternatives |\n| Compliance Burden | Licensing and management requirements increase costs and complexity |\n| Market Exclusion | Potential loss of access to China and other key markets |\n| Supply Chain Disruption | Disruption of warehousing and distribution, especially in Hong Kong |\n| Product Development Risks | New products may be restricted before launch, leading to stranded inventory |\n| Customer/End-User Restrictions | Additional restrictions on use, resale, repair, or transfer of products |\n| Regulatory/Geopolitical Risks | Increased scrutiny, potential penalties, and retaliatory measures |\n| Cloud/AI Service Impact | Reduced ability to provide and support cloud and AI services |\n| Investment/Innovation Risks | Uncertainty discourages investment in NVIDIA, benefits foreign competitors |\n\n## Conclusion\n\nThe new US export controls have placed NVIDIA at a significant competitive disadvantage, particularly in the China market, and introduced a range of risks that could materially impact its business, revenue, and 
financial results. The company faces ongoing challenges related to compliance, market access, supply chain stability, and regulatory scrutiny, all of which could be exacerbated by further changes in export control policies[5][3][1].",,4.0,5.0,5.0,"The answer is highly accurate and comprehensive, but a minor factual error exists in the claim of '$17 billion in sales in China in 2024'—no supporting evidence is found in the provided chunks, and the closest validated figure from the chunk refers to projected $12 billion from H20 AI chips[3][5]. The answer otherwise well-covers the risks, competitive impacts, and regulatory issues."
7,"What were the key components and figures of Oracle Corporation's consolidated statements of cash flows for the fiscal year ended May 31, 2024, including net income, operating cash flows, investing activities, and financing activities?",1022; 1016; 1019,"For the fiscal year ended May 31, 2024, Oracle Corporation's consolidated statements of cash flows included the following key components and figures:\n\n**Net Income:**\n- Oracle reported a net income of $10.467 billion for fiscal year 2024[2].\n\n**Cash Flows from Operating Activities:**\n- Net cash provided by operating activities was $18.673 billion, reflecting strong cash generation from core business operations.\n- Key adjustments to reconcile net income to operating cash flow included:\n - Depreciation: $3.129 billion\n - Amortization of intangible assets: $3.010 billion\n - Deferred income taxes (a reduction): $(2.139) billion\n - Stock-based compensation: $3.974 billion\n - Changes in working capital items such as an increase in trade receivables $(965) million and an increase in deferred revenues $656 million also impacted operating cash flow[2].\n\n**Cash Flows from Investing Activities:**\n- Net cash used for investing activities was $(7.360) billion.\n- Major investing cash flows included:\n - Purchases of marketable securities and other investments: $(1.003) billion\n - Proceeds from sales and maturities of marketable securities and other investments: $572 million\n - Acquisitions, net of cash acquired: $(63) million\n - Capital expenditures: $(6.866) billion[2].\n\n**Cash Flows from Financing Activities:**\n- Net cash used for financing activities was $(10.554) billion.\n- Significant financing cash flows included:\n - Payments for repurchases of common stock: $(1.202) billion\n - Proceeds from issuances of common stock: $742 million\n - Shares repurchased for tax withholdings upon vesting of restricted stock-based awards: $(2.040) billion\n - Payments of dividends to stockholders: $(4.391) 
billion\n - Repayments of senior notes and other borrowings: $(3.500) billion[2].\n\n**Cash and Cash Equivalents:**\n- Cash and cash equivalents at the end of the fiscal year were $10.454 billion, up from $9.765 billion at the beginning of the year[2].\n\nIn summary, Oracle generated strong operating cash flow of $18.7 billion in fiscal 2024, invested $7.4 billion primarily in capital expenditures and securities, and returned significant capital to shareholders through dividends and stock repurchases, resulting in a net cash outflow from financing activities of $10.6 billion[2][1].",Expecting value: line 1 column 1 (char 0),,,,
8,"What risks does Reddit, Inc. identify in its 2024 fiscal year report related to the dependency on its senior management team and key employees, particularly concerning CEO Steven Huffman?",1140; 1121; 1143,"The provided search results and context do not specifically mention risks related to Reddit's dependency on its senior management team, particularly concerning CEO Steven Huffman, in the 2024 fiscal year report. However, the context does discuss general risks related to human capital and culture, which could indirectly involve senior management. For instance, it mentions challenges in managing growth and maintaining corporate culture, which could impact innovation and teamwork[1][5]. If you are looking for specific information about risks related to senior management, it might be necessary to review the full report or additional sources.",Expecting value: line 1 column 1 (char 0),,,,
9,"What was the main reason for the increase in net cash provided by operating activities for Tesla, Inc. during the fiscal year ended December 31, 2024?",1347; 1342; 1334,"The main reason for the increase in net cash provided by operating activities for Tesla, Inc. during the fiscal year ended December 31, 2024, was primarily due to favorable changes in net operating assets and liabilities of $2.29 billion. This increase was partially offset by a decrease in net income excluding non-cash expenses, gains, and losses of $623 million[5]. \n\nIn summary, the improvement in cash flow from operating activities was largely driven by better management of working capital, which includes accounts receivable, inventory, and accounts payable, among other factors. However, the decrease in net income, excluding non-cash items, somewhat mitigated this positive effect.",,2.0,1.0,3.0,"The answer claims the main reason for the increase in net cash from operating activities was due to favorable changes in net operating assets and liabilities of $2.29 billion and a decrease in net income excluding non-cash items by $623 million, but these specific figures and causation are not supported or mentioned in the provided document chunk or search results. The document chunk identifiers (1347; 1342; 1334) are not linked to any concrete data in the search results. The answer also does not align well with the available data showing operating cash flow values but no explicit attribution of increases. The explanation is moderately clear but lacks support and completeness due to missing or unverifiable details."


In [22]:
# Preview the first 10 rows of final_df2; as the cell's last expression it is rendered as a table.
# NOTE(review): this cell's execution count (22) is higher than that of the only visible cell
# that assigns final_df2 (In [20], further down), so the cells were presumably run out of
# order — confirm the notebook still works under Restart Kernel -> Run All.
final_df2.head(10)

Unnamed: 0,question,top_k_chunk,answer,evaluation_factual_correctness_score,evaluation_completeness_score,evaluation_clarity_score,evaluation_comments,evaluation_error
0,"What types of financial statements are included in Amazon's 2024 financial report, as outlined in the document's index to consolidated financial statements?",85; 47; 52; 45; 13,"Based on the provided context, the types of financial statements included in Amazon's 2024 financial report are:\n\n- **Consolidated Statements of Cash Flows** for each of the three years ended December 31, 2024\n- **Consolidated Statements of Operations** for each of the three years ended December 31, 2024\n- **Consolidated Statements of Comprehensive Income (Loss)** for each of the three years ended December 31, 2024\n- **Consolidated Balance Sheets** as of December 31, 2023 and 2024\n- **Consolidated Statements of Stockholders’ Equity** for each of the three years ended December 31, 2024\n\nThese are explicitly mentioned in the context. However, if you are looking for a more detailed index or specific types not listed here, the provided context does not offer additional information beyond these statements.",2.0,2.0,4.0,"The answer lists plausible financial statements, but none of the named statements or years are explicitly supported by the provided context (document chunk: 85; 47; 52; 45; 13), which only contains page numbers without any statement names or contents. The answer is clear but not accurate or complete based on the given chunk.",
1,"What forward-looking statements are included in Apple Inc.'s Form 10-K for the fiscal year ended September 28, 2024, and how do they relate to potential future impacts on the company's business?",120; 345; 454; 93,"Based on the provided information, Apple Inc.'s Form 10-K for the fiscal year ended September 28, 2024, includes forward-looking statements that are typically located in Part I, Item 1 under the heading ""Business"" and Part II, Item 7 under the heading ""Management’s Discussion and Analysis of Financial Condition and Results of Operations"" [1][2]. These statements involve risks and uncertainties, such as the potential future impact of macroeconomic conditions on the company's business and results of operations [1]. Additionally, forward-looking statements may include those about payment of the Company's quarterly dividend and future business plans [4].\n\nHowever, specific details about these forward-looking statements and their relation to potential future impacts on Apple's business are not explicitly outlined in the provided context. Therefore, for detailed insights, it would be necessary to review the actual Form 10-K document. \n\nIn summary, while we know where to find these statements and some general topics they cover, the exact content and implications of these forward-looking statements are not detailed in the provided information.",5.0,4.0,5.0,"The answer correctly identifies where forward-looking statements can be found in Apple Inc.'s Form 10-K and mentions general topics such as macroeconomic risks and dividends, consistent with the provided sources. However, it notes the lack of specific detailed content in the document chunk, making it mostly complete but not fully detailed regarding the statements' explicit content and implications.",
2,"Based on the provided chunk regarding Cisco Systems’ fiscal year 2024 report, here is a question generated according to your requirements:\n\n**How did Cisco Systems’ management and principal officers assess the effectiveness of the company’s disclosure controls and procedures for fiscal year 2024, and what was their conclusion regarding those controls?**",287; 224; 214; 284,I don't know based on the provided document.,5.0,5.0,5.0,"The answer is consistent with the document chunk: no assessment of disclosure controls is found in the provided documents, so stating 'I don't know' is fully correct and clear.",
3,"How do evolving and uncertain regulations in areas such as AI, competition, consumer protection, content moderation, data privacy, news, and sustainability impact Alphabet Inc.'s business operations and risks, particularly as reported for the fiscal year ended December 31, 2024?",652; 347; 345; 353,"Evolving and uncertain regulations in areas such as AI, competition, consumer protection, content moderation, data privacy, news, and sustainability have a significant impact on Alphabet Inc.'s business operations and risk profile, as detailed in its fiscal year 2024 disclosures.\n\n**Key Impacts on Business Operations and Risks**\n\n- **Increased Regulatory Scrutiny and Compliance Costs** \n Alphabet faces heightened regulatory scrutiny from multiple jurisdictions, including the U.S., EU, UK, and China. New and evolving laws—such as the EU AI Act, Digital Markets Act, Digital Services Act, and proposed U.S. privacy legislation—impose substantial compliance obligations. These can increase operational costs, require changes to business practices, and limit the company’s ability to offer certain products or services[4].\n- **Operational and Strategic Challenges** \n The company must navigate a patchwork of regulations that are not always consistent across jurisdictions. This uncertainty can make it difficult to plan and execute global strategies, especially in areas like AI, data privacy, and content moderation. Alphabet may need to modify its business models, restrict certain activities, or delay product launches to comply with new or changing rules[4].\n- **Legal and Financial Risks** \n Alphabet is subject to ongoing investigations, lawsuits, and enforcement actions related to antitrust, data privacy, and AI. Violations of applicable laws—even unintentional ones—can result in significant fines, criminal sanctions, reputational damage, and restrictions on business operations. 
For example, the EU’s Digital Services Act allows for fines of up to 6% of global revenue for non-compliance[4].\n- **Impact on Innovation and Market Position** \n Regulatory restrictions on AI technologies, data usage, and advertising practices can limit Alphabet’s ability to innovate and maintain its competitive edge. Compliance burdens may also slow down the deployment of new systems and reduce the number of new entrants or customers in certain markets, potentially harming financial results[4].\n- **Reputational and Liability Risks** \n The development and use of AI, as well as issues related to harmful content and data privacy, expose Alphabet to reputational harm and increased liability. The company must continuously adapt to evolving legal standards and public expectations in these areas[4].\n- **Global and Geopolitical Considerations** \n Changes in trade policies, export controls, and geopolitical tensions—especially concerning AI-related hardware and software—can further complicate Alphabet’s operations. 
Restrictions on exports of GPUs and other technologies may limit the company’s ability to serve global customers and partners[4].\n\n**Summary Table: Regulatory Impact on Alphabet Inc.**\n\n| Regulatory Area | Impact on Operations & Risks |\n|------------------------|----------------------------------------------------------------------------------------------|\n| AI | Increased compliance costs, operational challenges, liability, and reputational risks |\n| Competition | Antitrust investigations, fines, restrictions on business practices, market position risks |\n| Consumer Protection | Compliance costs, changes to products/services, legal and reputational risks |\n| Content Moderation | Operational complexity, reputational risks, legal liability |\n| Data Privacy | Compliance costs, restrictions on data usage, legal and reputational risks |\n| News | Regulatory uncertainty, potential restrictions on content and partnerships |\n| Sustainability | Compliance costs, reputational risks, operational adjustments |\n\n**Conclusion**\n\nAlphabet Inc. is operating in a highly dynamic and uncertain regulatory environment. The company’s ability to manage these risks is critical to its ongoing success, but evolving and inconsistent regulations across jurisdictions present ongoing challenges to its business operations, financial results, and strategic initiatives for the fiscal year ended December 31, 2024[4].",,,,,Expecting value: line 1 column 1 (char 0)
4,"How does Meta Platforms, Inc. address the limitations and risks associated with forward-looking statements and the use of non-GAAP financial measures in its financial results for the fourth quarter and full year 2024?",442; 446; 449; 448; 447,"I don't know based on the provided document. The search results do not explicitly address how Meta Platforms, Inc. handles the limitations and risks associated with forward-looking statements and the use of non-GAAP financial measures in its financial results for the fourth quarter and full year 2024. However, general information about forward-looking statements typically includes discussions of risks and uncertainties, which can be found in SEC filings and investor relations materials[1][2][3]. For specific details, referring to Meta's official financial reports or press releases for that period would be necessary.",5.0,5.0,5.0,"The answer correctly states that the provided document does not explicitly address how Meta Platforms, Inc. manages the limitations and risks related to forward-looking statements and non-GAAP measures for Q4 and full year 2024. It also appropriately references general information from the cited search results about the presence of risk and uncertainty disclosures in Meta's SEC filings and financial reports, accurately reflecting the given data. The response is clear and precise in explaining the absence of direct information and suggests where such details are typically found.",
5,"What exhibits related to Netflix, Inc.’s fiscal year ended December 31, 2024, are included in the annual report, and what types of certifications and plans are filed with the SEC as part of this report?",453; 520; 521; 533; 534,"Based on the provided context, the exhibits included in Netflix, Inc.'s annual report for the fiscal year ended December 31, 2024, are listed as follows:\n\n- **EX-31.3**: Certification of the Chief Financial Officer pursuant to Section 302 of the Sarbanes-Oxley Act of 2002.\n- Other exhibits mentioned include **EX-19.1**, **EX-21.1**, **EX-23.1**, **EX-31.1**, **EX-31.2**, and **EX-32.1**.\n\nAs for certifications, the report includes those from the Co-Chief Executive Officers and the Chief Financial Officer under Sections 302 and 906 of the Sarbanes-Oxley Act of 2002.\n\nRegarding plans filed with the SEC, the context mentions the Netflix, Inc. 2020 Stock Plan and the Executive Officer Severance Plan.\n\nFor more detailed information on specific exhibits and plans, one would need to refer to the actual SEC filings or the annual report itself.",5.0,5.0,5.0,"The answer correctly identifies the exhibits related to Netflix's fiscal year ended December 31, 2024, including the certifications under Sections 302 and 906 of the Sarbanes-Oxley Act and mentions specific plans such as the 2020 Stock Plan and Executive Officer Severance Plan as filed with the SEC. It fully addresses both parts of the question clearly and comprehensively.",
6,"How have new US export control restrictions in 2024 negatively impacted NVIDIA Corporation's competitive position compared to certain competitors, and what specific risks do these controls pose for its future business and results in the China market and beyond?",662; 654; 653; 585; 637,"The new US export control restrictions in 2024 have negatively impacted NVIDIA Corporation's competitive position in several significant ways, particularly in the China market and beyond:\n\n### Negative Impact on NVIDIA's Competitive Position\n\n- **Restricted Sales of Key AI Chips**: The US government imposed export controls that restrict NVIDIA's ability to sell certain advanced AI chips, including the H20 chip designed specifically for the Chinese market. This chip now requires a special license for indefinite future sales in China, which has not been granted, leading to shipment delays and lost sales opportunities[2][3][5].\n\n- **Financial Impact**: NVIDIA has projected a $5.5 billion financial impact related to inventory, purchase commitments, and reserves tied to the H20 chip line due to these export controls. This sizable charge reflects the direct cost of restricted sales and excess inventory[2][3].\n\n- **Competitive Disadvantage**: Competitors who sell products not subject to these US restrictions or who can more easily acquire licenses gain a competitive advantage. The licensing process for NVIDIA is complicated, time-consuming, and uncertain, which discourages customers in China from purchasing NVIDIA products and encourages them to seek alternatives from semiconductor suppliers based in China, Europe, and Israel[Context].\n\n- **Supply Chain and Distribution Disruptions**: The controls also restrict gaming GPUs and networking products, potentially disrupting NVIDIA's supply and distribution chains, including those warehoused in Hong Kong. 
This disruption further harms NVIDIA's ability to serve demand efficiently[Context].\n\n- **Customer and Market Shifts**: Due to the cumbersome licensing and compliance requirements, customers in China and other affected regions may switch to competitors' products to avoid compliance burdens. Additionally, customers outside China might redesign their systems to exclude US semiconductors, further eroding NVIDIA's market share globally, including in Europe, Latin America, and Southeast Asia[Context].\n\n### Specific Risks for Future Business and Results\n\n- **Exclusion from Key Markets**: The export controls risk excluding NVIDIA from all or part of the China market and other impacted markets such as the Middle East. This exclusion could substantially reduce NVIDIA's revenue from these regions[Context].\n\n- **Increased Compliance Costs and Operational Complexity**: Managing licenses and compliance requirements is complicated and time-consuming, increasing operational costs and creating uncertainty in pre-sale and post-sale technical support. This complexity may harm customer relationships and future sales[Context].\n\n- **Potential for Further Restrictions**: Given the strategic importance of AI and geopolitical tensions, the US government may further tighten export controls, expanding the range of products subject to restrictions. 
This could prevent NVIDIA from selling existing inventory or developing replacement products not subject to licensing, further harming its competitive position and financial results[Context].\n\n- **Supply Chain Risks**: The need to transition some operations out of China and Hong Kong to comply with export controls is costly and time-consuming, potentially disrupting research, development, supply, and distribution operations during transition periods[Context].\n\n- **Impact on Research and Development**: Additional export restrictions may include deemed export control limitations that could negatively impact NVIDIA's ability to execute its research and development roadmap in a timely manner, affecting innovation and future product development[Context].\n\n- **Broader Market Impact**: Export controls not only affect sales in China but also could provoke retaliatory measures from foreign governments, negatively impacting NVIDIA's supply chain and ability to serve customers worldwide[Context].\n\nIn summary, the 2024 US export control restrictions have materially harmed NVIDIA's competitive position by limiting its ability to sell key AI chips in China, increasing operational and compliance burdens, disrupting supply chains, and encouraging customers to turn to less restricted competitors. These controls pose significant risks to NVIDIA's future business and financial results both in China and globally, with the potential for further deterioration if export controls expand or licenses are delayed or denied[Context][2][3][5].",5.0,5.0,5.0,"The answer is fully accurate, details all key impacts and risks, and is clearly structured with no major omissions or errors relative to the document chunk.",
7,"What were the key components and figures of Oracle Corporation's consolidated statements of cash flows for the fiscal year ended May 31, 2024, including net income, operating cash flows, investing activities, and financing activities?",831; 837; 835; 829; 832,"Here are the key components and figures of Oracle Corporation's consolidated statements of cash flows for the fiscal year ended May 31, 2024, based on the available information:\n\n## Key Components and Figures\n\n- **Net Income**: $10,467 million[2].\n- **Operating Cash Flows**: Net cash provided by operating activities was $18,700 million (reported as $18.7 billion) during fiscal year 2024, up 9% in USD[1][2].\n - **Adjustments to Reconcile Net Income to Net Cash Provided by Operating Activities**:\n - **Depreciation**: $3,129 million\n - **Amortization of Intangible Assets**: $3,010 million\n - **Deferred Income Taxes**: $(2,139) million\n - **Stock-Based Compensation**: $3,974 million\n - **Other, Net**: $720 million\n - **Changes in Operating Assets and Liabilities**:\n - **Increase in Trade Receivables, Net**: $(965) million\n - **Decrease in Prepaid Expenses and Other Assets**: $542 million\n - **Decrease in Accounts Payable and Other Liabilities**: $(594) million\n - **Decrease in Income Taxes Payable**: $(127) million\n - **Increase in Deferred Revenues**: $656 million[2].\n\nFor **Investing Activities** and **Financing Activities**, the provided context does not include detailed figures. 
However, the following information is available:\n\n- **Investing Activities**: The context does not provide specific figures for investing activities like purchases of marketable securities, proceeds from sales and maturities, acquisitions, or capital expenditures for the fiscal year ended May 31, 2024.\n- **Financing Activities**: Similarly, detailed figures for financing activities such as payments for repurchases of common stock, proceeds from issuances of common stock, payments of dividends, and repayments of senior notes are not explicitly stated in the context.\n\nTo obtain comprehensive details on investing and financing activities, one would need to refer to the full financial statements.",5.0,4.0,5.0,"The answer accurately presents key figures for net income and operating cash flows including detailed adjustments and changes in operating assets and liabilities, all consistent with the document chunk. It correctly notes the absence of specific investing and financing activities data in the provided context. The explanation is clear and well-structured, but completeness is slightly impacted by the lack of detailed investing and financing activities, which the answer appropriately acknowledges.",
8,"What risks does Reddit, Inc. identify in its 2024 fiscal year report related to the dependency on its senior management team and key employees, particularly concerning CEO Steven Huffman?",985; 922; 958; 929,"I don't know based on the provided documents. The context does not specifically mention risks related to the dependency on Reddit's senior management team, particularly concerning CEO Steven Huffman. However, it does mention a general risk related to the ability to identify, recruit, hire, and retain skilled personnel, including key members of senior management[5].",5.0,4.0,5.0,"The answer correctly states that the provided documents do not specifically mention risks related to dependency on senior management or CEO Steven Huffman but do mention general risks about hiring and retaining key personnel[5]. However, it could be slightly more complete by explicitly noting that the risk is general and not specifically linked to the CEO or senior management team as the question asks.",
9,"What was the main reason for the increase in net cash provided by operating activities for Tesla, Inc. during the fiscal year ended December 31, 2024?",416; 1098; 1086; 1091; 1093,"The main reason for the increase in net cash provided by operating activities for Tesla, Inc. during the fiscal year ended December 31, 2024, was primarily due to favorable changes in net operating assets and liabilities, which contributed approximately $2.29 billion. This positive effect was partially offset by a decrease in net income excluding non-cash expenses, gains, and losses of about $623 million. Overall, these factors led to an increase of $1.67 billion in net cash provided by operating activities, rising from $13.26 billion in 2023 to $14.92 billion in 2024[2].",2.0,2.0,4.0,"The answer claims a specific breakdown of asset/liability changes and net income impact not referenced in the chunk, and misrepresents the scale and cause of cash flow change seen in the documents, which only show general increases without such details.",


## MODEL 2

In [20]:
# Model 2 run: feeds QA2 (from example_2) through the qa/finalize helpers imported from example_1.
from user_models.example_1.model import qa, finalize
# NOTE(review): plot is not used anywhere in this cell — presumably needed by a later cell; confirm.
from user_models.createplot import plot
# NOTE(review): the recorded output of this cell is
#   ImportError: cannot import name 'QA2' from 'user_models.example_2.qa'
# so nothing below this import ran in that execution. Check which name
# user_models/example_2/qa.py actually defines before relying on this cell.
from user_models.example_2.qa import QA2
from user_models.evaluate import evaluate_answer

# presumably qa() runs the given model over the generated questions and returns a table of
# answers — TODO confirm against user_models.example_1.model
df2 = qa(QA2)
# presumably finalize() applies evaluate_answer to df2 and returns the scored table that the
# following cell previews — TODO confirm
final_df2 = finalize(evaluate_answer, df2)

ImportError: cannot import name 'QA2' from 'user_models.example_2.qa' (c:\Users\alice\perplexity_hack\user_models\example_2\qa.py)

In [None]:
# Preview the first 10 rows of the Model 2 results.
# NOTE(review): this cell has no execution count and the Model 2 cell above
# last failed with an ImportError, so any table rendered under this cell is
# likely left over from an earlier run — re-run once the import is fixed.
final_df2.head(10)

Unnamed: 0,question,top_k_chunk,answer,evaluation_factual_correctness_score,evaluation_completeness_score,evaluation_clarity_score,evaluation_comments
0,"How could challenges in hiring, retaining, and...",27; 1; 39,"Challenges in hiring, retaining, and managing ...",5,5,5,The answer thoroughly addresses how challenges...
1,What was the total lease liability for Apple I...,154; 386; 157,"As of September 28, 2024, Apple Inc. had fixed...",2,2,5,The answer correctly states the total lease li...
2,What are the key competitive challenges Cisco ...,321; 293; 248,"In 2024, Cisco faced several key competitive c...",4,4,5,"The answer is largely accurate, but lacks spec..."
3,Based on the Alphabet Inc. fiscal year ended D...,528; 527; 497,For Alphabet Inc. in the fiscal year ended Dec...,2,3,4,The answer provides specific per-share figures...
4,What were the key financial results reported b...,544; 552; 549,Here are the key financial results reported by...,4,4,5,"Most facts are correct and sourced, but there ..."
5,What operational and strategic challenges did ...,610; 609; 617,"Based on the available information, Netflix fa...",5,4,5,The answer correctly identifies all major oper...
6,"Question: \r\nWhere, as required by law, does...",768; 660; 723,NVIDIA Corporation files lobbying disclosure r...,5,5,5,The answer correctly states that NVIDIA files ...
7,What highlights or key financial metrics are i...,1022; 886; 1018,Oracle Corporation's fiscal year 2024 Form 10-...,5,5,5,The answer accurately presents key financial h...
8,"How does Reddit, Inc. plan to manage the poten...",1121; 1133; 1120,"Reddit, Inc. acknowledges the risk of user dec...",2,1,3,The model answer presents a comprehensive and ...
9,"Which Tesla, Inc. executives signed the compan...",1337; 1425; 1250,"The following Tesla, Inc. executives and direc...",5,5,5,"The model answer accurately lists all Tesla, I..."


In [None]:
# Plot the Model 2 results with user_models.createplot.plot.
# Depends on final_df2 being defined by the Model 2 cell earlier in the notebook.
plot(final_df2)