In [1]:
!pip install python-dotenv
!pip install openai



# Getting data from Mergeflow's API

In [5]:
import requests
import json
import os
from dotenv import load_dotenv # stores API keys for OpenAI and Mergeflow 

load_dotenv()  # Load variables from the local .env file into the environment

# Mergeflow API key, read from the environment (populated by load_dotenv above).
mergeflow_api_key = os.getenv('MERGEFLOW_API_KEY')
if not mergeflow_api_key:
    # Fail early with a clear message instead of sending an unauthenticated request.
    raise RuntimeError('MERGEFLOW_API_KEY is not set; add it to your .env file.')

# --- Build the API call ---
# URL-encoded search topic (here: "factory automation").
# Later cells also interpolate `query` into their prompts.
query = 'factory+automation'
# Access a dataset from Mergeflow - in this case venture capital investments.
dataset = '&q=*%5bfundingcompany%7cfundingproject%7cfundingorganization%5d&sp=2572'
rows = str(5)  # first 5 docs only

# Replace the user name below by your own. You can see your user name at mergeflow.net
# -> Account -> the string in angle brackets
mergeflow_user = 'ferdinandk'
url = (
    'https://mergeflow.net/api/v1/' + mergeflow_user
    + '/search/getContent?q=' + query + dataset + '&rows=' + rows
)

# Headers to be sent with the request (the API key authenticates the call).
headers = {
    'MergeflowNet-Api-Auth-Key': mergeflow_api_key
}

# Without a timeout, requests waits forever if the server never answers.
REQUEST_TIMEOUT_SECONDS = 30
response = requests.post(url, headers=headers, timeout=REQUEST_TIMEOUT_SECONDS)

# One dict per document with the keys 'title', 'date', 'url' and 'content'.
mergeflow_docs = []

# Check the response status code and content
if response.status_code == 200:
    mergeflow_response_json = response.json()

    # Tip: print(json.dumps(mergeflow_response_json, indent=4)) to inspect the raw JSON.

    # Get title, URL, date, and content of every returned document.
    # A response without a 'Documents' entry is treated as "no documents found".
    for document in mergeflow_response_json.get('Documents') or []:
        mergeflow_docs.append({
            'title': document['Title'],
            'date': document['Date'],
            'url': document['Url'],
            'content': document['Content']
        })

    print('Found ' + str(len(mergeflow_docs)) + ' documents.')

else:
    print('Request failed with status code:', response.status_code)
    print(response.text)  # Print the response text


Found 5 documents.


# Answering questions on the results with OpenAI GPT

In [6]:
import openai

openai.api_key = os.getenv('OPENAI_API_KEY')  # OpenAI API key from the environment / .env file

# `query` is URL-encoded for the Mergeflow call (e.g. "factory+automation").
# Use a human-readable form in the prompts so the model reads "factory automation".
topic = query.replace('+', ' ')

# Shared system prompt; the later rating and selection cells reuse it.
system_prompt = f"""You are the Chief Customer Officer of a company in the field of {topic}. Your work is highly crucial and you are responsible for identifying the most significant problems of your customer."""

# One generated problem description (a string) per Mergeflow document.
problems_list = []

for doc in mergeflow_docs:
    user_prompt1 = f"""


    Consider the text below, delimited by ```, in the area of {topic}:
    ```
    {doc['content']}
    ```

    Take a deep breath before working on this problem.

    You want to find pressing problems of your customers in the field of {topic} which would be worth solving. You are business minded and want to come up with a problem which your team should focus on - as your customer would really appreciate a solution and pay for it.

    For the problem you found, please only output the following (please write in total minimum 155 words):
        - "Title": Title of the problem in max 5 words.
        - "Explanation": The problem (please write 100-150 words)
        - "User group": Which user group is impacted by this problem the most (please write 10-30 words)
        - "Pain point": What is the specific pain point for this user group resulting from the problem (please write 40-50 words)

    """

    completion = openai.chat.completions.create(
        model="gpt-4-0125-preview",
        messages=[
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": user_prompt1}
        ],
        temperature=0.7,
        max_tokens=2000,
        top_p=0.95,
        frequency_penalty=0,
        presence_penalty=0,
        stop=None
    )

    # Keep the generated problem for the rating and selection cells below.
    problem_text = completion.choices[0].message.content
    problems_list.append(problem_text)

    # Show the problem, followed by a separator between the content blocks for readability.
    print(problem_text)
    print("\n---\n")

- **Title**: Efficient Supply Chain Management

- **Explanation**: In the rapidly evolving landscape of factory automation and robotics, a pressing problem is the efficient management of supply chains, particularly for startups like Aniai that are in the process of scaling production capabilities. The challenge lies in establishing a stable production line while simultaneously ensuring that the supply chain is resilient, flexible, and capable of meeting fluctuating demands. This includes sourcing raw materials, managing inventory, coordinating with suppliers, and handling logistics in a way that minimizes delays and reduces costs. For companies aiming to expand globally, like Aniai with its plans for North American and global expansion, this challenge is magnified by the need to navigate different regulatory environments, cultural differences, and potential disruptions in international trade.

- **User group**: Startup Companies in Robotics and Automation

- **Pain point**: The primary

In [7]:
# Rate every problem in problems_list on its own: one model call per problem.
# `query` is URL-encoded (e.g. "factory+automation"); use a readable form in the prompt.
topic = query.replace('+', ' ')

# One rating text (a string) per entry of problems_list, in the same order.
rated_problems_list = []
for problem in problems_list:
    # Only the problem being rated is sent. Embedding the whole problems_list in
    # every prompt made the token cost grow quadratically and left it ambiguous
    # which problem the model should rate.
    user_prompt2 = f"""

    Before you give me any output, please rate the problem below according to the following criteria. Please be very critical in your ratings and only give a 3 rating when it is very very very good:
        - Size of user group (how many of the mentioned customers exist) (1 = small target group, 2 = medium target group, 3 = large target group)
        - Relevancy of pain point to the specific industry of {topic} and the respective user group (e.g., patty not relevant for factory automation) (1 = not relevant to users, 2 = medium relevant to users, 3 = very relevant to users)
        - How specific is the problem? (1 = very generic problem, 2 = medium generic, 3 = specific and not generic problem)

    Given the problem:
    {problem}

    Please repeat the name of the problem and then output the ratings and a one-sentence justification (max 20 words).
    Add up the three ratings you gave to an overall score out of 9.

    """

    completion = openai.chat.completions.create(
        model="gpt-4-0125-preview",
        messages=[
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": user_prompt2}
        ],
        temperature=0.7,
        max_tokens=2000,
        top_p=0.95,
        frequency_penalty=0,
        presence_penalty=0,
        stop=None
    )

    # Store the rating so the selection cell can compare the problems later.
    rating_text = completion.choices[0].message.content
    rated_problems_list.append(rating_text)

    # Print the rated problem for immediate feedback
    print(rating_text)
    print("\n---\n")

**Problem: Efficient Supply Chain Management**

- Size of user group: 2 (Medium target group)
- Relevancy of pain point: 3 (Very relevant to users)
- How specific is the problem?: 2 (Medium generic)

**Justification**: Supply chain issues are common in robotics startups, highly relevant but somewhat broad in focus.

**Overall score**: 7/9

---

Title: Efficient Automation Integration

- Size of user group: 3 (Large target group)
- Relevancy of pain point: 3 (Very relevant to users)
- How specific is the problem: 2 (Medium specific)

Overall score: 8

Justification: Automation integration is critical across many sectors, highly relevant, but somewhat broad in scope.

---

**Title: Scalable Cell Therapy Manufacturing**

- Size of user group: 2 (Medium target group)
- Relevancy of pain point: 3 (Very relevant to users)
- How specific is the problem: 3 (Specific and not generic problem)

**Overall score: 8/9**

Justification: The cell therapy manufacturing challenge is highly relevant and 

In [8]:
# Ask the model to pick the problem with the highest overall rating.

# Pair every problem with its rating as readable text. Interpolating the raw
# lists would hand the model Python list reprs with escaped newlines and no
# visible link between a problem and its rating.
rated_problem_blocks = "\n\n".join(
    f"Problem {number}:\n{problem}\n\nRating of problem {number}:\n{rating}"
    for number, (problem, rating) in enumerate(
        zip(problems_list, rated_problems_list), start=1
    )
)

user_prompt3 = f"""

    Consider the following problems and their corresponding ratings:

{rated_problem_blocks}

    Please output the problem with the highest overall rating, including the following bullet points:
        - "Title": Title of the problem in max 5 words.
        - "Explanation": The problem (please write 100-150 words)
        - "User group": Which user group is impacted by this problem the most (please write 10-30 words)
        - "Pain point": What is the specific pain point for this user group resulting from the problem (please write 40-50 words)

    """

if not rated_problem_blocks:
    # Nothing was generated or rated above, so there is nothing to choose from.
    print('No rated problems available to choose from.')
else:
    completion = openai.chat.completions.create(
        model="gpt-4-0125-preview",
        messages=[
            {"role": "system", "content": system_prompt},
            {"role": "user", "content": user_prompt3}
        ],
        temperature=0.7,
        max_tokens=2000,
        top_p=0.95,
        frequency_penalty=0,
        presence_penalty=0,
        stop=None
    )

    # Print the selected best problem
    print(completion.choices[0].message.content)
    print("\n---\n")


- **Title**: Scalable Cell Therapy Manufacturing

- **Explanation**: The production of cell therapies is experiencing pivotal challenges in scaling up to meet both clinical and commercial demands. The shift from manual, small-scale processes to automated, large-scale operations introduces complexities such as maintaining product quality, ensuring consistent processes, and adhering to strict regulatory standards. As therapies progress from clinical trials towards commercialization, the ability to efficiently scale production becomes essential. Unfortunately, many existing facilities lack the required flexibility and technological integration, creating bottlenecks that can delay product delivery and inflate costs.

- **User group**: Cell therapy manufacturers, especially those moving from clinical to commercial-scale production.

- **Pain point**: The main pain point for this group is the difficulty in efficiently scaling up production while adhering to regulatory standards and ensuring 