In [3]:
import logging
import traceback


# Configure root logging up front, before the remaining modules are imported.
# Records go both to a log file (opened with mode 'w', so it is rewritten each
# time this cell runs) and to the stream handler shown in the notebook output.
_LOG_FORMAT = '%(asctime)s - %(name)s - %(levelname)s - %(message)s'
_log_handlers = [
    logging.FileHandler("../../app.log", mode='w'),
    logging.StreamHandler(),
]
logging.basicConfig(level=logging.DEBUG, format=_LOG_FORMAT, handlers=_log_handlers)

# Imports
- The libraries and tools this notebook relies on

In [4]:
from gensphere import genflow, yaml_utils
from gensphere.genflow import GenFlow
from gensphere.yaml_utils import YamlCompose
from gensphere.visualizer import Visualizer
from gensphere.hub import Hub
from dotenv import load_dotenv
import os

In [None]:
# Pull the variables defined in the .env file into the environment.
load_dotenv()

# Look up every API key in one pass; a key is None when its variable is unset.
(
    GROQ_API_KEY,
    HUGGINGFACE_API_KEY,
    OPENAI_API_KEY,
    OPENROUTER_API_KEY,
    COMPOSIO_API_KEY,
    FIRECRAWL_API_KEY,
) = (
    os.environ.get(variable_name)
    for variable_name in (
        "GROQ_API_KEY",
        "HUGGINGFACE_API_KEY",
        "OPENAI_API_KEY",
        "OPENROUTER_API_KEY",
        "COMPOSIO_API_KEY",
        "FIRECRAWL_API_KEY",
    )
)

# Objective
- Create a workflow that automatically finds the latest papers from Papers With Code, explores their abstracts, and attempts to develop a new startup idea based on them

In [5]:
# Visualisation: build a visualizer for the analyzer workflow and start it on
# the local address/port given below.
_viz_sources = (
    'papers_with_code_analyzer.yaml',
    'gensphere_functions.py',
    'structured_output_schema.py',
)
viz = Visualizer(*_viz_sources, address='127.0.0.1', port=8050)
viz.start_visualization()

2024-11-25 08:56:39,196 - gensphere.graph_builder - INFO - Total elements generated: 11
2024-11-25 08:56:39,234 - urllib3.connectionpool - DEBUG - Starting new HTTP connection (1): 127.0.0.1:8050
2024-11-25 08:56:39,238 - urllib3.connectionpool - DEBUG - http://127.0.0.1:8050 "GET /_alive_60f7037a-1cfb-4f02-b361-5aff434ee240 HTTP/11" 200 5


In [9]:
# Compose the workflow rooted at startup_idea_evaluator.yaml and save the
# combined result to combined.yaml, which the GenFlow cell loads next.
composer = YamlCompose(
    'startup_idea_evaluator.yaml',
    'gensphere_functions.py',
    'structured_output_schema.py',
)
_compose_options = {'save_combined_yaml': True, 'output_file': 'combined.yaml'}
combined_yaml_data = composer.compose(**_compose_options)

2024-11-25 09:12:53,812 - gensphere.yaml_utils - INFO - Starting composition with root YAML file 'd:\CODING\LOCAL\ai\PERSONAL PROJECTS\projectGensphere\src\papers_with_code\startup_idea_evaluator.yaml'
2024-11-25 09:12:53,813 - gensphere.yaml_utils - INFO - Checking for YAML file 'd:\CODING\LOCAL\ai\PERSONAL PROJECTS\projectGensphere\src\papers_with_code\startup_idea_evaluator.yaml' consistency
2024-11-25 09:12:53,815 - gensphere.yaml_utils - DEBUG - Validating YAML file 'd:\CODING\LOCAL\ai\PERSONAL PROJECTS\projectGensphere\src\papers_with_code\startup_idea_evaluator.yaml'
2024-11-25 09:12:53,825 - gensphere.yaml_utils - DEBUG - Validating YAML file 'd:\CODING\LOCAL\ai\PERSONAL PROJECTS\projectGensphere\src\papers_with_code\papers_with_code_analyzer.yaml'
2024-11-25 09:12:53,828 - composio - INFO - Logging is set to INFO, use `logging_level` argument or `COMPOSIO_LOGGING_LEVEL` change this
2024-11-25 09:12:53,838 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): ba

In [10]:
# Per-logger verbosity overrides: quiet composio down to warnings while keeping
# the gensphere / GenFlow loggers at full debug detail.
for _logger_name, _logger_level in (
    ('composio', logging.WARNING),
    ('gensphere', logging.DEBUG),
    ('GenFlow', logging.DEBUG),
):
    logging.getLogger(_logger_name).setLevel(_logger_level)

In [13]:
# Load the composed workflow, parse its YAML definition, then execute it.
_workflow_sources = (
    'combined.yaml',
    'gensphere_functions.py',
    'structured_output_schema.py',
)
flow = GenFlow(*_workflow_sources)
flow.parse_yaml()
flow.run()

2024-11-25 09:18:10,356 - httpx - DEBUG - load_ssl_context verify=True cert=None trust_env=True http2=False
2024-11-25 09:18:10,357 - httpx - DEBUG - load_verify_locations cafile='d:\\CODING\\LOCAL\\ai\\PERSONAL PROJECTS\\projectGensphere\\.venv\\Lib\\site-packages\\certifi\\cacert.pem'
2024-11-25 09:18:10,371 - gensphere.yaml_utils - DEBUG - Validating YAML file 'd:\CODING\LOCAL\ai\PERSONAL PROJECTS\projectGensphere\src\papers_with_code\combined.yaml'
2024-11-25 09:18:10,385 - urllib3.connectionpool - DEBUG - Starting new HTTPS connection (1): backend.composio.dev:443
2024-11-25 09:18:10,845 - urllib3.connectionpool - DEBUG - https://backend.composio.dev:443 "GET /api/v1/connectedAccounts?user_uuid=default&showActiveOnly=true HTTP/11" 200 None
2024-11-25 09:18:13,090 - urllib3.connectionpool - DEBUG - https://backend.composio.dev:443 "GET /api/v2/actions?apps=firecrawl HTTP/11" 200 None
2024-11-25 09:18:13,318 - urllib3.connectionpool - DEBUG - https://backend.composio.dev:443 "GET /a

In [14]:
# Inspect everything the run collected; as the cell's last expression the value
# is echoed below (here a dict keyed by node name, one entry per executed node).
flow.outputs

{'read_idea': {'domains': 'startup that creates integrate web3 using generative AI. The business model would be B2C.\n'},
 'papers_with_code_analyzer__get_current_date': {'current_date': '2024-11-25'},
 'papers_with_code_analyzer__get_timewindow': {'time_window': 'past day'},
 'papers_with_code_analyzer__papers_with_code_scrape': {'papers_with_code_latest_research_articles': 'I retrieved the latest papers from Papers With Code that were published in the last day from November 2024. Here are some of the notable ones:\n\n1. **[Enhancing person re-identification via Uncertainty Feature Fusion Method and Auto-weighted Measure Combination](https://paperswithcode.com/paper/enhancing-person-re-identification-via-1)**\n   - Authors: [GitHub Link](https://github.com/chequanghuy/Enhancing-Person-Re-Identification-via-UFFM-and-AMC)\n\n2. **[FedMLLM: Federated Fine-tuning MLLM on Multimodal Heterogeneity Data](https://paperswithcode.com/paper/fedmllm-federated-fine-tuning-mllm-on)**\n   - Authors:

In [15]:
# Visualize the final output node
from IPython.display import display, Markdown


def _unwrap_markdown_fence(text):
    """Remove an enclosing ```markdown (or ```md) code fence from ``text``.

    The report-generating model may wrap its whole answer in a fenced code
    block. Passing that straight to ``Markdown`` renders the report as literal
    code instead of formatted headings and tables, so the opening fence line
    and the last bare closing fence line are dropped. Any text the model added
    after the closing fence is kept.

    Args:
        text: Raw report string.

    Returns:
        ``text`` unchanged when it does not start with a markdown fence,
        otherwise the text with the fence lines removed.
    """
    lines = text.strip().splitlines()
    if not lines or lines[0].strip().lower() not in ("```markdown", "```md"):
        return text
    body = lines[1:]
    # Search from the end so that code blocks nested inside the report keep
    # their own fences; only the outermost closing fence is removed.
    for index in range(len(body) - 1, -1, -1):
        if body[index].strip() == "```":
            del body[index]
            break
    return "\n".join(body)


# Index instead of chaining .get(): if the node or its field is missing this
# raises a KeyError naming the missing key, rather than an AttributeError on None.
final_node_output = flow.outputs["generate_report"]["report"]

display(Markdown(_unwrap_markdown_fence(final_node_output)))

```markdown
# VC Analyst Report: Web3 and Generative AI Startup Analysis

## 1. Overview of the Latest Papers on Paperswithcode.com

The startup idea proposes the integration of Web3 with generative AI to create a B2C application. Here's a brief overview of the recent research papers and their potential applicability to the startup:

- **Enhancing Person Re-Identification via Uncertainty Feature Fusion Method and Auto-weighted Measure Combination**: Focuses on identity detection with uncertainty measures, which might be useful for applications involving user identities within web3 platforms, enhancing security and personalization.

- **FedMLLM: Federated Fine-tuning MLLM on Multimodal Heterogeneity Data**: This paper discusses federated learning and tapping into private data sources across modalities. This is crucial for handling diverse and private data in decentralized Web3 apps.

- **Cosmological Analysis with Calibrated Neural Quantile Estimation and Approximate Simulators**: Not directly applicable for consumer web applications but introduces computational techniques for scalable data analysis which could inspire backend frameworks.

- **Large Multi-modal Models Can Interpret Features in Large Multi-modal Models**: Provides insights into decoding complex neural representations. Could assist in understanding and personalizing user interactions within Web3 applications.

- **Cross-Modal Pre-Aligned Method with Global and Local Information for Remote-Sensing Image and Text Retrieval**: Offers retrieval methods for textual and visual data, which could help in building intelligent search features within Web3 applications.

- **Multiset Transformer: Advancing Representation Learning in Persistence Diagrams**: While more theoretical, it provides advanced data representation techniques, potentially useful in blockchain data operations.

- **Geminio: Language-Guided Gradient Inversion Attacks in Federated Learning**: Discusses privacy attacks which are crucial to consider for security in any Web3 application.

- **AttriBoT: A Bag of Tricks for Efficiently Approximating Leave-One-Out Context Attribution**: Proposes methods for data contextualization which could enhance personalized experiences in consumer apps.

### Best Paper for Startup Application
Given the startup's focus, **FedMLLM** appears most valuable, addressing the need for private, heterogeneous data handling which is key for consumer trust in B2C Web3 applications.

## 2. List of Potential Competitors

- **ConsenSys**: Known for its Ethereum-based software and development suite, it could leverage generative AI for enhanced user interactions.
  
- **Chainlink**: Focuses on data integration from off-chain to on-chain, potentially augmenting Web3 experiences with AI-driven content creation.
  
- **Fetch.ai**: A platform providing a system for autonomous machine-to-machine ecosystem backed by AI which may overlap the startup's vision.
  
- **Ocean Protocol**: They aim to unlock data, primarily for AI models. Their framework could be extended to generative applications in Web3, posing a competitive threat.

### Rationale
These companies focus on integrating advanced AI with decentralized technologies, aligning closely with the proposed startup’s vision.

## 3. Promising Research Papers

The following papers indicate potential for significant user onboarding by addressing crucial pain points:

1. **FedMLLM**: As mentioned, valuable for developing private and secure consumer applications by leveraging federated learning.
  
2. **Cross-Modal Pre-Aligned Method**: Useful for enhancing user retrieval experiences in applications that could integrate varied data sources.
  
3. **Enhancing Person Re-Identification**: For startups aiming to include identity verification features, this provides methods for enhancing security with generative techniques.

## 4. Table of Latest Research Papers

| Paper Title                                                                                             | Release Date | Key Insights                                                                                                              | Potential Application                       |
|---------------------------------------------------------------------------------------------------------|--------------|---------------------------------------------------------------------------------------------------------------------------|---------------------------------------------|
| Enhancing Person Re-Identification via Uncertainty Feature Fusion Method and Auto-weighted Measure Combination  | Nov 2024     | Identity detection with uncertainty; improves security                                                                   | User identity within Web3 platforms        |
| FedMLLM: Federated Fine-tuning MLLM on Multimodal Heterogeneity Data                                          | Nov 2024     | Federated learning with private data; enhances utility in handling heterogeneous data                                     | Secure and private data handling in apps   |
| Cosmological Analysis with Calibrated Neural Quantile Estimation and Approximate Simulators                    | Nov 2024     | Advanced data inference and computation                                                                                   | Backend frameworks for scalable operations |
| Large Multi-modal Models Can Interpret Features in Large Multi-modal Models                                    | Nov 2024     | Complex neural representation understanding                                                                               | Personalization in user interactions       |
| Cross-Modal Pre-Aligned Method with Global and Local Information for Remote-Sensing Image and Text Retrieval    | Nov 2024     | Integrates retrieval systems for images and text                                                                          | Intelligent search in apps                 |
| Multiset Transformer: Advancing Representation Learning in Persistence Diagrams                                 | Nov 2024     | Enhanced data representation techniques                                                                                   | Blockchain data operations                 |
| Geminio: Language-Guided Gradient Inversion Attacks in Federated Learning                                       | Nov 2024     | New attack methods in federated learning; crucial for security                                                             | Security considerations in Web3 apps       |
| AttriBoT: A Bag of Tricks for Efficiently Approximating Leave-One-Out Context Attribution                       | Nov 2024     | Efficient data contextualization                                                                                          | Personalized app experiences               |

This analysis positions the startup to leverage cutting-edge research to build a compelling Web3 application that can successfully penetrate the consumer market.
```

This markdown report should render smoothly in a Jupyter Notebook, providing a comprehensive overview with clear sections, tables, and explanations directly aligned with the startup's proposed direction in the field of web3 and generative AI.