In [5]:
# Huggingface models
# Single sampling temperature reused by the model wrappers defined below.
overall_temperature = 0.1

from langchain import PromptTemplate, HuggingFaceHub, LLMChain

# NOTE(review): credentials for the Hugging Face Hub are presumably configured
# in an earlier cell or in the environment -- confirm before running.

# Flan-UL2, limited to 200 newly generated tokens per call.
flan_20B = HuggingFaceHub(
    repo_id="google/flan-ul2",
    model_kwargs={"temperature": overall_temperature, "max_new_tokens": 200},
)

# Flan-T5-XXL, same generation settings as Flan-UL2.
flan_t5xxl = HuggingFaceHub(
    repo_id="google/flan-t5-xxl",
    model_kwargs={"temperature": overall_temperature, "max_new_tokens": 200},
)

# GPT-J 6B uses a smaller budget (100 new tokens) than the Flan models.
gpt_j6B = HuggingFaceHub(
    repo_id="EleutherAI/gpt-j-6B",
    model_kwargs={"temperature": overall_temperature, "max_new_tokens": 100},
)

In [6]:
# OpenAI models
from langchain.llms import OpenAI, OpenAIChat

# Both OpenAI-backed wrappers reuse `overall_temperature` and cap each
# completion at 256 tokens.
chatGPT_turbo = OpenAIChat(
    model_name="gpt-3.5-turbo",
    temperature=overall_temperature,
    max_tokens=256,
)

gpt3_davinci_003 = OpenAI(
    model_name="text-davinci-003",
    temperature=overall_temperature,
    max_tokens=256,
)

In [7]:
# # Cohere models
# (Disabled cell: nothing here executes. Uncomment to define the Cohere
# wrappers; both use the shared `overall_temperature` like the other models.)
# from langchain.llms import Cohere

# cohere_command_xl = Cohere(model = 'command-xlarge',
#                            temperature=overall_temperature,
#                            max_tokens=256)

# cohere_command_xl_nightly = Cohere(model='command-xlarge-nightly',
#                                    temperature=overall_temperature,
#                                    max_tokens=256)


In [14]:
# comparison lab

from langchain.model_laboratory import ModelLaboratory
from langchain.prompts import PromptTemplate

# Prompt layout: the question, a blank line, then an answer cue that asks the
# model to reason step by step.
template = (
    "Question: {question}\n"
    "\n"
    "Answer: Let's think step by step."
)

prompt = PromptTemplate(input_variables=["question"], template=template)

# Line-up of models that receive the same prompt; gpt_j6B is currently
# commented out of the comparison.
lab = ModelLaboratory.from_llms(
    [
        chatGPT_turbo,
        gpt3_davinci_003,
        # gpt_j6B,
        flan_20B,
        flan_t5xxl,
    ],
    prompt=prompt,
)

# NOTE: "oppisite" is misspelled in the prompt; it is kept verbatim so the
# recorded output of this cell still matches the input that produced it.
lab.compare("What is the oppisite of up?")

[1mInput:[0m
What is the oppisite of up?

[1mOpenAIChat[0m
Params: {'model_name': 'gpt-3.5-turbo', 'temperature': 0.1, 'max_tokens': 256}
[36;1m[1;3mThe opposite of up is down.[0m

[1mOpenAI[0m
Params: {'model_name': 'text-davinci-003', 'temperature': 0.1, 'max_tokens': 256, 'top_p': 1, 'frequency_penalty': 0, 'presence_penalty': 0, 'n': 1, 'request_timeout': None, 'logit_bias': {}}
[33;1m[1;3m The opposite of up is down.[0m

[1mHuggingFaceHub[0m
Params: {'repo_id': 'google/flan-ul2', 'task': None, 'model_kwargs': {'temperature': 0.1, 'max_new_tokens': 200}}
[38;5;200m[1;3mUp is the opposite of down. Down is below up. Up is on top of down. The answer: down.[0m

[1mHuggingFaceHub[0m
Params: {'repo_id': 'google/flan-t5-xxl', 'task': None, 'model_kwargs': {'temperature': 0.1, 'max_new_tokens': 200}}
[32;1m[1;3mDown is the opposite of up. Down is the opposite of up. The answer: down.[0m



In [11]:
# Multi-step arithmetic word problem sent to every model in the current `lab`.
lab.compare(
    'Answer the following question by reasoning step by step. '
    'The cafeteria had 23 apples. '
    'If they used 20 for lunch, and bought 6 more, how many apples do they have?'
)

[1mInput:[0m
Answer the following question by reasoning step by step. The cafeteria had 23 apples. If they used 20 for lunch, and bought 6 more, how many apples do they have?

[1mOpenAIChat[0m
Params: {'model_name': 'gpt-3.5-turbo', 'temperature': 0.1, 'max_tokens': 256}
[36;1m[1;3mStep 1: The cafeteria had 23 apples.
Step 2: They used 20 apples for lunch.
Step 3: To find out how many apples they have left, we subtract the number of apples used from the initial number of apples: 23 - 20 = 3.
Step 4: The cafeteria bought 6 more apples.
Step 5: To find out how many apples they have now, we add the number of apples they had left after lunch to the number of apples they bought: 3 + 6 = 9.
Step 6: Therefore, the cafeteria now has 9 apples.[0m

[1mOpenAI[0m
Params: {'model_name': 'text-davinci-003', 'temperature': 0.1, 'max_tokens': 256, 'top_p': 1, 'frequency_penalty': 0, 'presence_penalty': 0, 'n': 1, 'request_timeout': None, 'logit_bias': {}}
[33;1m[1;3m 

Step 1: The cafeteria

In [15]:
# The question is wrapped in a leading and a trailing newline, exactly as the
# triple-quoted form produced.
lab.compare(
    "\n"
    "Can Geoffrey Hinton have a conversation with George Washington? "
    "Give the rationale before answering.\n"
)

[1mInput:[0m

Can Geoffrey Hinton have a conversation with George Washington? Give the rationale before answering.


[1mOpenAIChat[0m
Params: {'model_name': 'gpt-3.5-turbo', 'temperature': 0.1, 'max_tokens': 256}
[36;1m[1;3mFirst, we need to consider the fact that Geoffrey Hinton is a renowned computer scientist and one of the pioneers of deep learning and artificial intelligence. On the other hand, George Washington was the first President of the United States and lived during the 18th century.

Given this information, it is clear that Geoffrey Hinton and George Washington belong to different time periods. Hinton is a contemporary figure, while Washington lived over two centuries ago. Therefore, it is impossible for them to have a direct conversation in the traditional sense.

However, if we consider the hypothetical scenario of time travel or some advanced technology that allows communication across time periods, it might be possible for Hinton and Washington to exchange inform

In [17]:
# Story-writing prompt: a persona sentence carrying the request, followed by a
# "Story:" cue on its own line. Leading/trailing newlines are part of the text.
template = (
    "\n"
    "You are a creative story teller who can write wonderful interesting short stories: {question}\n"
    "\n"
    "Story:\n"
)

prompt = PromptTemplate(input_variables=["question"], template=template)

# Rebuild the lab so the same model line-up uses the new prompt; gpt_j6B
# remains commented out.
lab = ModelLaboratory.from_llms(
    [
        chatGPT_turbo,
        gpt3_davinci_003,
        # gpt_j6B,
        flan_20B,
        flan_t5xxl,
    ],
    prompt=prompt,
)

lab.compare(
    "\n"
    "Write a sad story about a carrot named Jason. "
    "The story should start with the carrot being a professional athlete of some kind, "
    "and end with the carrot having his heart broken.\n"
)

[1mInput:[0m

Write a sad story about a carrot named Jason. The story should start with the carrot being a professional athlete of some kind, and end with the carrot having his heart broken.


[1mOpenAIChat[0m
Params: {'model_name': 'gpt-3.5-turbo', 'temperature': 0.1, 'max_tokens': 256}
[36;1m[1;3mOnce upon a time, in the vibrant land of Veggieville, there lived a carrot named Jason. Jason was not your ordinary carrot; he possessed an extraordinary talent for running. With his slender body and vibrant orange hue, he had become a professional athlete, competing in the prestigious Veggie Games.

Jason had always dreamt of becoming a champion, and his hard work and dedication had finally paid off. He had won numerous races, breaking records and capturing the hearts of the vegetable community. His speed was unmatched, and he was adored by fans far and wide.

One sunny day, as Jason was preparing for his next race, he noticed a beautiful tomato named Lily in the crowd. Her radiant re

In [22]:
# Prompt that explicitly allows the model to answer that it does not know.
template = (
    "Answer the question to the best of your abilities but if you are not sure "
    "then answer you don't know: {question}\n"
    "\n"
    "Answer:"
)

prompt = PromptTemplate(input_variables=['question'], template=template)

# Rebuild the lab so the same model line-up uses the new prompt; gpt_j6B
# remains commented out.
lab = ModelLaboratory.from_llms(
    [
        chatGPT_turbo,
        gpt3_davinci_003,
        # gpt_j6B,
        flan_20B,
        flan_t5xxl,
    ],
    prompt=prompt,
)

lab.compare(
    "\n"
    "I am riding a bicycle. The pedals are moving fast. "
    "I look into the mirror and I am not moving. Why is this?\n"
)

[1mInput:[0m

I am riding a bicycle. The pedals are moving fast. I look into the mirror and I am not moving. Why is this?


[1mOpenAIChat[0m
Params: {'model_name': 'gpt-3.5-turbo', 'temperature': 0.1, 'max_tokens': 256}
[36;1m[1;3mI don't know.[0m

[1mOpenAI[0m
Params: {'model_name': 'text-davinci-003', 'temperature': 0.1, 'max_tokens': 256, 'top_p': 1, 'frequency_penalty': 0, 'presence_penalty': 0, 'n': 1, 'request_timeout': None, 'logit_bias': {}}
[33;1m[1;3m You are likely coasting, meaning you are not pedaling and the bike is still moving due to the momentum from your previous pedaling.[0m

[1mHuggingFaceHub[0m
Params: {'repo_id': 'google/flan-ul2', 'task': None, 'model_kwargs': {'temperature': 0.1, 'max_new_tokens': 200}}
[38;5;200m[1;3mI am stationary[0m

[1mHuggingFaceHub[0m
Params: {'repo_id': 'google/flan-t5-xxl', 'task': None, 'model_kwargs': {'temperature': 0.1, 'max_new_tokens': 200}}
[32;1m[1;3mI am looking at the wrong angle.[0m



In [25]:
# Minimal prompt: the caller-supplied text verbatim, a blank line, then an
# "Answer:" cue. All instructions must therefore come with the question itself.
template = (
    "{question}\n"
    "\n"
    "Answer:"
)

prompt = PromptTemplate(input_variables=["question"], template=template)

# Rebuild the lab so the same model line-up uses the new prompt; gpt_j6B
# remains commented out.
lab = ModelLaboratory.from_llms(
    [
        chatGPT_turbo,
        gpt3_davinci_003,
        # gpt_j6B,
        flan_20B,
        flan_t5xxl,
    ],
    prompt=prompt,
)

# Question answering over a pasted article: the question, an output-format
# instruction and the article text are all passed as one string to
# `lab.compare`.
# The explicit \n escapes sit next to physical line breaks inside the
# triple-quoted string, so each escape adds an extra blank line to the prompt
# (visible in the echoed "Input:" of this cell's output).
lab.compare('''Please answer the question:\n
Who is the OnePlus COO?\n\n
Output in the format: [first_name, surname]\n\n

Smartphone makers searched for a way forward at MWC 2023
Foldables, 6G, light shows -- there are a lot of ideas floating around, but no one has cracked the code
The slowdown was inevitable, of course. Nothing stays hot forever — especially in this industry. By tech standards, smartphones have had a good run, but the last few years have seen device makers searching for the magic bullet to help the sales slide reverse course. The arrival of 5G was a nice reprieve, but next-generation telecom standards don’t arrive every year.

“I personally think foldables are supply chain-driven innovation and not consumer insights,” Pei said. “Somebody invents OLED, and they can make a lot of money, because it’s a great technology. Then after a few years, a lot more companies make that, so they need to lower their prices. So they need to figure out what else they can sell at a higher margin. They develop flexible OLEDs, which they can sell at a higher price.”
It’s hard not to be cynical about this stuff sometimes. Ditto for concept devices, though as I noted in my “ode to weird tech” post, as someone who follows this stuff for a living, I’m a fan of weirdness for weirdness sake, be it the rollable Motorola Rizr screen or the OnePlus glowing cooling fluid. Certainly following the automotive industry’s lead of creating concept devices is a trend that is likely to only become more pervasive.

OnePlus COO Kinder Liu told me this week that gauging consumer interest is one of the “multiple reasons” his company is engaging with the concept. He added, “Also, we want to encourage continuous innovation inside our company.”

Pretty much everyone I engaged with this week echoed the sentiment that smartphones are in a rut. For the first time, however, it’s not a foregone conclusion that there’s a way of getting out.
''')

[1mInput:[0m
Please answer the question:

Who is the OnePlus COO?


Output in the format: [first_name, surname]



Smartphone makers searched for a way forward at MWC 2023
Foldables, 6G, light shows -- there are a lot of ideas floating around, but no one has cracked the code
The slowdown was inevitable, of course. Nothing stays hot forever — especially in this industry. By tech standards, smartphones have had a good run, but the last few years have seen device makers searching for the magic bullet to help the sales slide reverse course. The arrival of 5G was a nice reprieve, but next-generation telecom standards don’t arrive every year.

“I personally think foldables are supply chain-driven innovation and not consumer insights,” Pei said. “Somebody invents OLED, and they can make a lot of money, because it’s a great technology. Then after a few years, a lot more companies make that, so they need to lower their prices. So they need to figure out what else they can sell at a higher mar

In [26]:
# Question answering over a pasted article: the question and the article text
# are passed as one string to `lab.compare`; no output format is requested
# here.
# The explicit \n escapes sit next to physical line breaks inside the
# triple-quoted string, so each escape adds an extra blank line to the prompt
# (visible in the echoed "Input:" of this cell's output).
lab.compare('''Please answer the question:\n
What is a supply chain driven innovation?\n\n

Smartphone makers searched for a way forward at MWC 2023
Foldables, 6G, light shows -- there are a lot of ideas floating around, but no one has cracked the code
The slowdown was inevitable, of course. Nothing stays hot forever — especially in this industry. By tech standards, smartphones have had a good run, but the last few years have seen device makers searching for the magic bullet to help the sales slide reverse course. The arrival of 5G was a nice reprieve, but next-generation telecom standards don’t arrive every year.

“I personally think foldables are supply chain-driven innovation and not consumer insights,” Pei said. “Somebody invents OLED, and they can make a lot of money, because it’s a great technology. Then after a few years, a lot more companies make that, so they need to lower their prices. So they need to figure out what else they can sell at a higher margin. They develop flexible OLEDs, which they can sell at a higher price.”
It’s hard not to be cynical about this stuff sometimes. Ditto for concept devices, though as I noted in my “ode to weird tech” post, as someone who follows this stuff for a living, I’m a fan of weirdness for weirdness sake, be it the rollable Motorola Rizr screen or the OnePlus glowing cooling fluid. Certainly following the automotive industry’s lead of creating concept devices is a trend that is likely to only become more pervasive.

OnePlus COO Kinder Liu told me this week that gauging consumer interest is one of the “multiple reasons” his company is engaging with the concept. He added, “Also, we want to encourage continuous innovation inside our company.”

Pretty much everyone I engaged with this week echoed the sentiment that smartphones are in a rut. For the first time, however, it’s not a foregone conclusion that there’s a way of getting out.
''')

[1mInput:[0m
Please answer the question:

What is a supply chain driven innovation?



Smartphone makers searched for a way forward at MWC 2023
Foldables, 6G, light shows -- there are a lot of ideas floating around, but no one has cracked the code
The slowdown was inevitable, of course. Nothing stays hot forever — especially in this industry. By tech standards, smartphones have had a good run, but the last few years have seen device makers searching for the magic bullet to help the sales slide reverse course. The arrival of 5G was a nice reprieve, but next-generation telecom standards don’t arrive every year.

“I personally think foldables are supply chain-driven innovation and not consumer insights,” Pei said. “Somebody invents OLED, and they can make a lot of money, because it’s a great technology. Then after a few years, a lot more companies make that, so they need to lower their prices. So they need to figure out what else they can sell at a higher margin. They develop flexible O